Ankit Thakur committed on
Commit
c57fdf3
·
1 Parent(s): bf85b2f

everything

Browse files
Files changed (4) hide show
  1. app.py +52 -99
  2. config.py +21 -22
  3. requirements.txt +11 -11
  4. validate_prescription.py +87 -286
app.py CHANGED
@@ -1,137 +1,90 @@
1
  import os
2
  import streamlit as st
3
- from PIL import Image
4
- from config import (
5
- STATIC_DIR,
6
- UPLOADS_DIR,
7
- HF_TOKEN,
8
- GOOGLE_API_KEY,
9
- GOOGLE_CSE_ID,
10
- GEMINI_API_KEY,
11
- DEVICE
12
- )
13
 
14
- # ─── App Configuration ────────────────────────────────────────────────────
15
- st.set_page_config(
16
- page_title="RxGuard Prescription Validator",
17
- page_icon="⚕️",
18
- layout="wide",
19
- menu_items={
20
- 'Get Help': 'https://github.com/your-repo',
21
- 'About': "RxGuard v1.0 - Advanced Prescription Validation"
22
- }
23
- )
24
 
25
- # ─── Session State ────────────────────────────────────────────────────────
26
  if "analysis_result" not in st.session_state:
27
  st.session_state.analysis_result = None
28
  if "uploaded_filename" not in st.session_state:
29
  st.session_state.uploaded_filename = None
30
 
31
- # ─── UI Components ────────────────────────────────────────────────────────
32
  def show_service_status():
33
  """Displays service connectivity status."""
34
- cols = st.columns(4)
35
- with cols[0]:
36
- st.metric("HuggingFace", "✅" if HF_TOKEN else "❌")
37
- with cols[1]:
38
- st.metric("Google API", "✅" if GOOGLE_API_KEY else "❌")
39
- with cols[2]:
40
- st.metric("Gemini", "✅" if GEMINI_API_KEY else "❌")
41
- with cols[3]:
42
- st.metric("Device", DEVICE.upper())
43
-
44
- def display_patient_info(info: dict):
45
- """Displays patient information in a formatted card."""
46
- with st.container(border=True):
47
- st.subheader("👤 Patient Details")
48
- cols = st.columns(2)
49
- with cols[0]:
50
- st.markdown(f"**Name:** {info.get('Name', 'Not detected')}")
51
- st.markdown(f"**Age:** {info.get('Age', 'N/A')}")
52
- with cols[1]:
53
- st.markdown(f"**Date:** {info.get('Date', 'N/A')}")
54
- st.markdown(f"**Physician:** {info.get('PhysicianName', 'N/A')}")
55
-
56
- def display_medications(medications: list):
57
- """Displays medication information with verification."""
58
- st.subheader("💊 Medications")
59
- if not medications:
60
- st.warning("No medications detected in prescription")
61
- return
62
-
63
- for med in medications:
64
- with st.expander(f"{med.get('drug_raw', 'Unknown Medication')}"):
65
- cols = st.columns([1, 2])
66
- with cols[0]:
67
- st.markdown(f"""
68
- **Dosage:** `{med.get('dosage', 'N/A')}`
69
- **Frequency:** `{med.get('frequency', 'N/A')}`
70
- """)
71
-
72
- with cols[1]:
73
- if verification := med.get("verification"):
74
- if dosage := verification.get("standard_dosage"):
75
- st.success(f"**Standard Dosage:** {dosage}")
76
- if side_effects := verification.get("side_effects"):
77
- st.warning(f"**Side Effects:** {side_effects}")
78
- if interactions := verification.get("interactions"):
79
- st.error(f"**Interactions:** {interactions}")
80
 
81
- # ─── Main Application ─────────────────────────────────────────────────────
82
  def main():
83
  st.title("⚕️ RxGuard Prescription Validator")
84
- st.caption("AI-powered prescription verification system")
85
-
86
  show_service_status()
87
-
88
  # Only enable upload if required services are available
89
- if all([HF_TOKEN, GOOGLE_API_KEY, GEMINI_API_KEY]):
90
  uploaded_file = st.file_uploader(
91
- "Upload prescription image (PNG/JPG/JPEG):",
92
  type=["png", "jpg", "jpeg"],
93
- help="Clear image of the prescription"
94
  )
95
-
96
  if uploaded_file and uploaded_file.name != st.session_state.uploaded_filename:
97
  with st.status("Analyzing prescription...", expanded=True) as status:
98
  try:
99
- # Store the uploaded file
100
  st.session_state.uploaded_filename = uploaded_file.name
101
  file_path = os.path.join(UPLOADS_DIR, uploaded_file.name)
102
-
103
  with open(file_path, "wb") as f:
104
  f.write(uploaded_file.getvalue())
105
-
106
- # Import processing function only when needed
107
  from validate_prescription import extract_prescription_info
108
  st.session_state.analysis_result = extract_prescription_info(file_path)
109
-
110
  status.update(label="Analysis complete!", state="complete", expanded=False)
111
  except Exception as e:
112
- st.error(f"Processing failed: {str(e)}")
113
  st.session_state.analysis_result = {"error": str(e)}
114
  status.update(label="Analysis failed", state="error")
115
-
116
- # Display results if available
117
- if st.session_state.analysis_result:
118
- result = st.session_state.analysis_result
119
-
120
- if result.get("error"):
121
- st.error(f"❌ Error: {result['error']}")
 
122
  else:
123
- tab1, tab2 = st.tabs(["Patient Information", "Medication Details"])
124
-
 
125
  with tab1:
126
- if uploaded_file:
127
- st.image(uploaded_file, use_column_width=True)
128
- display_patient_info(result["info"])
129
-
 
 
 
 
 
 
 
 
 
 
 
 
 
130
  with tab2:
131
- display_medications(result["info"].get("Medications", []))
132
-
133
- if st.toggle("Show technical details"):
134
- st.json(result.get("debug_info", {}))
135
 
136
  if __name__ == "__main__":
137
  main()
 
1
  import os
2
  import streamlit as st
3
+ from config import STATIC_DIR, HF_TOKEN, GOOGLE_API_KEY, DEVICE
 
 
 
 
 
 
 
 
 
4
 
5
+ # App Configuration
6
+ st.set_page_config(page_title="RxGuard Prescription Validator", page_icon="⚕️", layout="wide")
7
+
8
+ # Initialize directories and session state
9
+ UPLOADS_DIR = os.path.join(STATIC_DIR, "uploads")
10
+ os.makedirs(UPLOADS_DIR, exist_ok=True)
 
 
 
 
11
 
 
12
  if "analysis_result" not in st.session_state:
13
  st.session_state.analysis_result = None
14
  if "uploaded_filename" not in st.session_state:
15
  st.session_state.uploaded_filename = None
16
 
 
17
  def show_service_status():
18
  """Displays service connectivity status."""
19
+ st.caption("Service Status")
20
+ cols = st.columns(3)
21
+ cols[0].metric("HuggingFace Models", "✅" if HF_TOKEN else "❌")
22
+ cols[1].metric("Google AI Services", "✅" if GOOGLE_API_KEY else "❌")
23
+ cols[2].metric("Hardware Accelerator", DEVICE.upper())
24
+ st.divider()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
 
 
26
  def main():
27
  st.title("⚕️ RxGuard Prescription Validator")
28
+ st.caption("Advanced, multi-source AI verification system")
 
29
  show_service_status()
30
+
31
  # Only enable upload if required services are available
32
+ if all([HF_TOKEN, GOOGLE_API_KEY]):
33
  uploaded_file = st.file_uploader(
34
+ "Upload a prescription image (PNG/JPG/JPEG):",
35
  type=["png", "jpg", "jpeg"],
36
+ help="Upload a clear image of the prescription for analysis."
37
  )
38
+
39
  if uploaded_file and uploaded_file.name != st.session_state.uploaded_filename:
40
  with st.status("Analyzing prescription...", expanded=True) as status:
41
  try:
 
42
  st.session_state.uploaded_filename = uploaded_file.name
43
  file_path = os.path.join(UPLOADS_DIR, uploaded_file.name)
 
44
  with open(file_path, "wb") as f:
45
  f.write(uploaded_file.getvalue())
46
+
47
+ # Lazily import the processing function
48
  from validate_prescription import extract_prescription_info
49
  st.session_state.analysis_result = extract_prescription_info(file_path)
 
50
  status.update(label="Analysis complete!", state="complete", expanded=False)
51
  except Exception as e:
52
+ st.error(f"A critical error occurred during processing: {str(e)}")
53
  st.session_state.analysis_result = {"error": str(e)}
54
  status.update(label="Analysis failed", state="error")
55
+
56
+ else:
57
+ st.error("Missing API Keys. Please configure HF_TOKEN and GOOGLE_API_KEY in your Space secrets.")
58
+
59
+ # Display results if available in the session state
60
+ if result := st.session_state.get("analysis_result"):
61
+ if error := result.get("error"):
62
+ st.error(f"❌ Analysis Error: {error}")
63
  else:
64
+ info = result.get("info", {})
65
+ tab1, tab2 = st.tabs(["**👤 Patient & Prescription Info**", "**⚙️ Technical Details**"])
66
+
67
  with tab1:
68
+ col1, col2 = st.columns([1, 2])
69
+ with col1:
70
+ if uploaded_file:
71
+ st.image(uploaded_file, use_column_width=True, caption="Uploaded Prescription")
72
+ with col2:
73
+ st.subheader("Patient Details")
74
+ st.info(f"**Name:** {info.get('Name', 'Not detected')}")
75
+ st.info(f"**Age:** {info.get('Age', 'N/A')}")
76
+ st.subheader("Prescription Details")
77
+ st.info(f"**Date:** {info.get('Date', 'N/A')}")
78
+ st.info(f"**Physician:** {info.get('PhysicianName', 'N/A')}")
79
+
80
+ st.divider()
81
+ st.subheader("💊 Medications")
82
+ for med in info.get("Medications", []):
83
+ st.success(f"**Drug:** {med.get('drug_raw')} | **Dosage:** {med.get('dosage', 'N/A')} | **Frequency:** {med.get('frequency', 'N/A')}")
84
+
85
  with tab2:
86
+ st.subheader("Debug Information from AI Pipeline")
87
+ st.json(result.get("debug_info", {}))
 
 
88
 
89
  if __name__ == "__main__":
90
  main()
config.py CHANGED
@@ -2,37 +2,36 @@ import os
2
  import torch
3
  from dotenv import load_dotenv
4
 
 
5
  load_dotenv()
6
 
7
- # ─── Directory Configuration ────────────────────────────────────────────────
8
  BASE_DIR = os.path.dirname(os.path.abspath(__file__))
9
  STATIC_DIR = os.path.join(BASE_DIR, 'static')
10
  os.makedirs(STATIC_DIR, exist_ok=True)
11
 
12
- # ─── API Secrets ────────────────────────────────────────────────────────────
13
- HF_TOKEN = os.getenv("HUGGINGFACE_HUB_TOKEN") # For Hugging Face models
14
- GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY") # For Gemini and Custom Search
15
- GOOGLE_CSE_ID = os.getenv("GOOGLE_CSE_ID") # For medication verification
16
- GEMINI_API_KEY = os.getenv("GEMINI_API_KEY") # Alternative Gemini auth
17
- HALODOC_API_KEY = os.getenv("HALODOC_API_KEY") # Future integration
 
 
 
18
  GOOGLE_APPLICATION_CREDENTIALS = os.getenv("GOOGLE_APPLICATION_CREDENTIALS")
19
 
20
- # ─── Model Configuration ────────────────────────────────────────────────────
21
  HF_MODELS = {
22
- "donut": "naver-clova-ix/donut-base-finetuned-cord-v2",
23
- "phi3": "microsoft/phi-3-mini-4k-instruct",
 
 
24
  }
25
- GEMINI_MODEL_NAME = "gemini-1.5-flash" # Balanced for speed and accuracy
26
-
27
- # ─── Processing Parameters ─────────────────────────────────────────────────
28
- LEV_THRESH = 0.75 # Levenshtein similarity threshold
29
- SIG_THRESH = 0.65 # Signature verification threshold
30
 
31
- # ─── File Paths ───────────────────────────────────────────────────────────
32
  DB_PATH = os.path.join(STATIC_DIR, "rxguard.db")
33
- UPLOADS_DIR = os.path.join(STATIC_DIR, "uploads")
34
- os.makedirs(UPLOADS_DIR, exist_ok=True)
35
-
36
- # ─── Hardware Configuration ────────────────────────────────────────────────
37
- DEVICE = "cpu" # Force CPU for Hugging Face Spaces compatibility
38
- USE_GPU = False
 
2
  import torch
3
  from dotenv import load_dotenv
4
 
5
+ # Load environment variables from a .env file if it exists
6
  load_dotenv()
7
 
8
+ # ─── Environment & Directory Setup ────────────────────────────────────────────
9
  BASE_DIR = os.path.dirname(os.path.abspath(__file__))
10
  STATIC_DIR = os.path.join(BASE_DIR, 'static')
11
  os.makedirs(STATIC_DIR, exist_ok=True)
12
 
13
+ # ─── Hardware Configuration ───────────────────────────────────────────────────
14
+ # Automatically use GPU if available (recommended for Hugging Face Spaces with T4)
15
+ USE_GPU = torch.cuda.is_available()
16
+ DEVICE = "cuda" if USE_GPU else "cpu"
17
+
18
+ # ─── API & Model Configuration ────────────────────────────────────────────────
19
+ # API Keys should be set as Secrets in your Hugging Face Space
20
+ HF_TOKEN = os.getenv("HF_TOKEN")
21
+ GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")
22
  GOOGLE_APPLICATION_CREDENTIALS = os.getenv("GOOGLE_APPLICATION_CREDENTIALS")
23
 
24
+ # Model IDs for the hybrid pipeline
25
  HF_MODELS = {
26
+ # Layout-aware model for initial structured extraction
27
+ "donut": "Javeria98/donut-base-Medical_Handwritten_Prescriptions_Information_Extraction_Final_model1",
28
+ # Small, powerful model for re-parsing medication details
29
+ "phi3": "Muizzzz8/phi3-prescription-reader"
30
  }
31
+ # Final resolver model
32
+ GEMINI_MODEL_NAME = "gemini-1.5-flash"
 
 
 
33
 
34
+ # ─── File Paths (can be used for other utilities) ─────────────────────────────
35
  DB_PATH = os.path.join(STATIC_DIR, "rxguard.db")
36
+ SIGNATURES_DIR = os.path.join(STATIC_DIR, "signatures")
37
+ os.makedirs(SIGNATURES_DIR, exist_ok=True)
 
 
 
 
requirements.txt CHANGED
@@ -1,23 +1,23 @@
1
  # Core
2
  streamlit==1.36.0
3
  python-dotenv==1.0.1
 
4
 
5
- # AI & Vision
6
- # Using Google's recommended versions for Gemini and Vision
7
  google-generativeai==0.7.1
8
- google-cloud-vision==3.7.3
 
 
9
  torch==2.3.1
10
- pillow==10.3.0
11
- transformers==4.41.0
 
 
12
 
13
- # OCR
14
  paddleocr==2.7.3
15
- # Using the CPU version of paddlepaddle for broader compatibility on HF Spaces
16
  paddlepaddle==2.6.1
17
 
18
  # Utils
19
  numpy==1.26.4
20
- requests==2.32.3
21
- opencv-python-headless==4.10.0.84
22
- scikit-image==0.22.0
23
- pytz==2024.1
 
1
  # Core
2
  streamlit==1.36.0
3
  python-dotenv==1.0.1
4
+ pandas==2.2.2
5
 
6
+ # AI & Vision - Google
 
7
  google-generativeai==0.7.1
8
+
9
+ # AI & Vision - Hugging Face (for T4 GPU with CUDA 12.1)
10
+ --extra-index-url https://download.pytorch.org/whl/cu121
11
  torch==2.3.1
12
+ transformers==4.42.3
13
+ accelerate==0.31.0
14
+ bitsandbytes==0.43.1
15
+ sentencepiece==0.2.0
16
 
17
+ # OCR (as a potential fallback or utility)
18
  paddleocr==2.7.3
 
19
  paddlepaddle==2.6.1
20
 
21
  # Utils
22
  numpy==1.26.4
23
+ Pillow==10.3.0
 
 
 
validate_prescription.py CHANGED
@@ -2,23 +2,17 @@ import os
2
  import re
3
  import json
4
  import logging
5
- import time
6
- import numpy as np
7
  import tempfile
8
- import sqlite3
9
  import torch
10
- import io
11
- from typing import Dict, Any, List, Optional
12
  from PIL import Image
13
- from dotenv import load_dotenv
14
- from googleapiclient.discovery import build
15
 
16
  # Suppress verbose backend logs
17
  os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"
18
- load_dotenv()
19
 
20
  try:
21
- from transformers import pipeline, DonutProcessor, VisionEncoderDecoderModel, AutoTokenizer
22
  from huggingface_hub import login
23
  import google.generativeai as genai
24
  except ImportError as e:
@@ -26,68 +20,25 @@ except ImportError as e:
26
  raise
27
 
28
  from config import (
29
- DB_PATH,
30
- HF_TOKEN,
31
- HF_MODELS,
32
- GOOGLE_API_KEY,
33
- GOOGLE_APPLICATION_CREDENTIALS,
34
- GEMINI_MODEL_NAME,
35
- DEVICE,
36
- USE_GPU,
37
- GOOGLE_CSE_ID,
38
  )
39
 
40
- # ─── Configure Logging & Auth ────────────────────────────────────────────────
41
  logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
42
- if HF_TOKEN:
43
- login(token=HF_TOKEN)
44
 
45
- # ─── Singleton Holders for AI Models ─────────────────────────────────────────
46
- _MODELS = {}
47
- _TEMP_CRED_FILE = None
48
-
49
- class GoogleSearch:
50
- """Performs Google Custom Search API queries."""
51
  def __init__(self):
52
- self.api_key = GOOGLE_API_KEY
53
- self.cse_id = GOOGLE_CSE_ID
54
- self.service = None
55
- if self.api_key and self.cse_id:
56
- try:
57
- self.service = build("customsearch", "v1", developerKey=self.api_key)
58
- logging.info("Google Custom Search initialized.")
59
- except Exception as e:
60
- logging.error(f"CSE init failed: {e}")
61
- else:
62
- logging.warning("GOOGLE_API_KEY or GOOGLE_CSE_ID not set; search disabled.")
63
-
64
- def search(self, queries: list, num_results: int = 1) -> list:
65
- if not self.service:
66
- return []
67
- out = []
68
- for q in queries:
69
- try:
70
- resp = self.service.cse().list(q=q, cx=self.cse_id, num=num_results).execute()
71
- items = resp.get("items", [])
72
- formatted = [
73
- {"title": it.get("title"), "link": it.get("link"), "snippet": it.get("snippet")}
74
- for it in items
75
- ]
76
- out.append({"query": q, "results": formatted})
77
- except Exception as e:
78
- logging.error(f"Search error for '{q}': {e}")
79
- out.append({"query": q, "results": []})
80
- return out
81
-
82
- # Initialize Google Search globally
83
- google_search = GoogleSearch()
84
 
85
- def get_model(name: str):
86
- """Loads and caches AI models to avoid reloading."""
87
- if name not in _MODELS:
88
  model_id = HF_MODELS.get(name)
89
- if not model_id:
90
- return None
91
 
92
  logging.info(f"Loading model '{name}' ({model_id}) to device '{DEVICE}'...")
93
  try:
@@ -95,242 +46,92 @@ def get_model(name: str):
95
  if name == "donut":
96
  processor = DonutProcessor.from_pretrained(model_id)
97
  model = VisionEncoderDecoderModel.from_pretrained(model_id, **quantization_config)
98
- _MODELS[name] = {"model": model, "processor": processor}
99
  elif name == "phi3":
100
- model = pipeline(
101
- "text-generation",
102
- model=model_id,
103
- torch_dtype=torch.bfloat16,
104
- trust_remote_code=True,
105
- **quantization_config
106
- )
107
- _MODELS[name] = {"model": model}
108
  logging.info(f"Model '{name}' loaded successfully.")
109
  except Exception as e:
110
  logging.error(f"Failed to load model '{name}': {e}", exc_info=True)
111
- _MODELS[name] = None
112
-
113
- return _MODELS.get(name)
114
-
115
- def get_gemini_client():
116
- """Initializes and returns the Gemini client."""
117
- global _TEMP_CRED_FILE
118
 
119
- if "gemini" not in _MODELS:
120
- # Write out credentials file if needed
121
  if creds_json_str := GOOGLE_APPLICATION_CREDENTIALS:
122
- if not _TEMP_CRED_FILE or not os.path.exists(_TEMP_CRED_FILE):
123
  with tempfile.NamedTemporaryFile(mode="w", delete=False, suffix=".json") as tfp:
124
  tfp.write(creds_json_str)
125
- _TEMP_CRED_FILE = tfp.name
126
- os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = _TEMP_CRED_FILE
127
-
128
  try:
129
  genai.configure(api_key=GOOGLE_API_KEY)
130
- _MODELS["gemini"] = genai.GenerativeModel(GEMINI_MODEL_NAME)
131
  except Exception as e:
132
  logging.error(f"Gemini init failed: {e}")
133
- _MODELS["gemini"] = None
134
-
135
- return _MODELS.get("gemini")
136
-
137
- def verify_medication_with_google(medication_name: str) -> Dict[str, Any]:
138
- """Verifies medication details using Google Search API."""
139
- if not medication_name:
140
- return {"error": "No medication name provided"}
141
-
142
- queries = [
143
- f"standard dosage for {medication_name}",
144
- f"side effects of {medication_name}",
145
- f"drug interactions with {medication_name}"
146
- ]
147
-
148
- search_results = google_search.search(queries, num_results=2)
149
- return {
150
- "medication": medication_name,
151
- "verification_results": search_results
152
- }
153
-
154
- def step1_run_donut(image: Image.Image) -> Dict[str, Any]:
155
- donut_components = get_model("donut")
156
- if not donut_components:
157
- return {"error": "Donut model not available."}
158
-
159
- model = donut_components["model"].to(DEVICE)
160
- processor = donut_components["processor"]
161
-
162
- task_prompt = "<s_cord-v2>"
163
- decoder_input_ids = processor.tokenizer(
164
- task_prompt, add_special_tokens=False, return_tensors="pt"
165
- ).input_ids.to(DEVICE)
166
- pixel_values = processor(image, return_tensors="pt").pixel_values.to(DEVICE)
167
-
168
- outputs = model.generate(
169
- pixel_values,
170
- decoder_input_ids=decoder_input_ids,
171
- max_length=model.decoder.config.max_position_embeddings,
172
- early_stopping=True,
173
- use_cache=True,
174
- num_beams=1,
175
- bad_words_ids=[[processor.tokenizer.unk_token_id]],
176
- return_dict_in_generate=True,
177
- )
178
- sequence = (
179
- processor.batch_decode(outputs.sequences)[0]
180
- .replace(processor.tokenizer.eos_token, "")
181
- .replace(processor.tokenizer.pad_token, "")
182
- )
183
- return processor.token2json(sequence)
184
-
185
- def step2_run_phi3(medication_text: str) -> str:
186
- phi3_components = get_model("phi3")
187
- if not phi3_components:
188
- return medication_text
189
-
190
- pipe = phi3_components["model"]
191
- prompt = (
192
- f"Normalize the following prescription medication line into its components "
193
- f"(drug, dosage, frequency). Raw text: '{medication_text}'"
194
- )
195
- outputs = pipe(prompt, max_new_tokens=100, do_sample=False)
196
- return outputs[0]["generated_text"].split("Normalized:")[-1].strip()
197
-
198
- def step3_run_gemini_resolver(
199
- image: Image.Image, donut_result: Dict[str, Any], phi3_results: List[str]
200
- ) -> Dict[str, Any]:
201
- gemini_client = get_gemini_client()
202
- if not gemini_client:
203
- return {"error": "Gemini resolver not available."}
204
-
205
- prompt = f"""
206
- You are an expert pharmacist's assistant whose sole objective is to reconcile and verify prescription details by cross-referencing multiple AI model outputs against the original prescription image (the ultimate source of truth).
207
-
208
- Attached Inputs:
209
- 1. Prescription image file
210
- 2. Donut Model Output (layout-aware):
211
- {json.dumps(donut_result, indent=2)}
212
- 3. Phi-3 Model Output (medication refinement):
213
- {json.dumps(phi3_results, indent=2)}
214
-
215
- Please follow these steps **in order**:
216
 
217
- 1. **Extract & Normalize**
218
- - Read the prescription image and extract: Patient Name, Date, Age, Physician Name, and each listed medication.
219
- - Normalize dates to MM/DD/YYYY and medication names to their exact printed form.
220
-
221
- 2. **Compare Model Outputs**
222
- - For each field (Name, Date, Age, PhysicianName), check both model outputs and flag any discrepancies.
223
- - For each medication entry, compare `drug_raw`, `dosage`, and `frequency` from Phi-3 with the layout cues from Donut.
224
-
225
- 3. **Verify Against Image**
226
- - Wherever the two models disagree, use the image text as the tiebreaker.
227
- - If both models miss or misread something (e.g. a dosage or frequency), pull it directly from the image.
228
-
229
- 4. **Error Correction**
230
- - Correct spelling errors, unit inconsistencies (e.g. "mg" vs "MG"), and frequency shorthand (e.g. "BID" → "twice a day").
231
-
232
- 5. **Assemble Final JSON**
233
- - Populate exactly this schema; do not add extra keys.
234
- - If a field is unreadable or absent on the image, set its value to `null`.
235
-
236
- **Final JSON Schema**
237
- ```json
238
- {{
239
- "Name": "string or null",
240
- "Date": "string (MM/DD/YYYY) or null",
241
- "Age": "string or null",
242
- "PhysicianName": "string or null",
243
- "Medications": [
244
- {{
245
- "drug_raw": "string",
246
- "dosage": "string or null",
247
- "frequency": "string or null",
248
- "verification": {{
249
- "standard_dosage": "string or null",
250
- "side_effects": "string or null",
251
- "interactions": "string or null"
252
- }}
253
- }}
254
- ]
255
- }}
256
- """
257
-
258
- try:
259
- response = gemini_client.generate_content(
260
- [prompt, image],
261
- generation_config={"response_mime_type": "application/json"},
262
- )
263
- result = json.loads(response.text)
264
-
265
- # Enhance with Google Search verification
266
- for med in result.get("Medications", []):
267
- if drug_name := med.get("drug_raw"):
268
- verification = verify_medication_with_google(drug_name)
269
- med["verification"] = {
270
- "standard_dosage": self._extract_dosage_info(verification),
271
- "side_effects": self._extract_side_effects(verification),
272
- "interactions": self._extract_interactions(verification)
273
- }
274
-
275
- return result
276
- except Exception as e:
277
- logging.error(f"Gemini resolver failed: {e}")
278
- return {"error": f"Gemini failed to resolve data: {e}"}
279
-
280
- def _extract_dosage_info(verification_data: Dict) -> Optional[str]:
281
- """Extracts dosage information from verification results."""
282
- for result in verification_data.get("verification_results", []):
283
- if "standard dosage" in result.get("query", "").lower():
284
- return result.get("results", [{}])[0].get("snippet")
285
- return None
286
 
287
- def _extract_side_effects(verification_data: Dict) -> Optional[str]:
288
- """Extracts side effects information from verification results."""
289
- for result in verification_data.get("verification_results", []):
290
- if "side effects" in result.get("query", "").lower():
291
- return result.get("results", [{}])[0].get("snippet")
292
- return None
 
 
 
 
 
 
293
 
294
- def _extract_interactions(verification_data: Dict) -> Optional[str]:
295
- """Extracts drug interactions information from verification results."""
296
- for result in verification_data.get("verification_results", []):
297
- if "interactions" in result.get("query", "").lower():
298
- return result.get("results", [{}])[0].get("snippet")
299
- return None
300
 
301
  def extract_prescription_info(image_path: str) -> Dict[str, Any]:
302
- """Runs the full hybrid AI pipeline."""
303
- try:
304
- image = Image.open(image_path).convert("RGB")
305
-
306
- logging.info("Step 1: Running Donut model for layout analysis...")
307
- donut_data = step1_run_donut(image)
308
-
309
- medication_lines = [
310
- item.get("text", "")
311
- for item in donut_data.get("menu", [])
312
- if "medi" in item.get("category", "").lower()
313
- ]
314
-
315
- logging.info("Step 2: Running Phi-3 model for medication refinement...")
316
- phi3_refined_meds = [step2_run_phi3(line) for line in medication_lines]
317
-
318
- logging.info("Step 3: Running Gemini model as the expert resolver...")
319
- final_info = step3_run_gemini_resolver(image, donut_data, phi3_refined_meds)
320
-
321
- if final_info.get("error"):
322
- return final_info
323
-
324
- result = {
325
- "info": final_info,
326
- "error": None,
327
- "debug_info": {
328
- "donut_output": donut_data,
329
- "phi3_refinements": phi3_refined_meds,
330
- },
331
- }
332
- return result
333
-
334
- except Exception as e:
335
- logging.error(f"Hybrid extraction pipeline failed: {e}", exc_info=True)
336
- return {"error": f"An unexpected error occurred in the pipeline: {e}"}
 
2
  import re
3
  import json
4
  import logging
 
 
5
  import tempfile
 
6
  import torch
7
+ import streamlit as st
8
+ from typing import Dict, Any, List
9
  from PIL import Image
 
 
10
 
11
  # Suppress verbose backend logs
12
  os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"
 
13
 
14
  try:
15
+ from transformers import pipeline, DonutProcessor, VisionEncoderDecoderModel
16
  from huggingface_hub import login
17
  import google.generativeai as genai
18
  except ImportError as e:
 
20
  raise
21
 
22
  from config import (
23
+ HF_TOKEN, HF_MODELS, GOOGLE_API_KEY,
24
+ GOOGLE_APPLICATION_CREDENTIALS, GEMINI_MODEL_NAME, DEVICE, USE_GPU
 
 
 
 
 
 
 
25
  )
26
 
27
+ # Configure Logging & Auth
28
  logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
29
+ if HF_TOKEN: login(token=HF_TOKEN)
 
30
 
31
+ class PrescriptionProcessor:
32
+ """Encapsulates the entire hybrid pipeline to resolve the 'self' error."""
 
 
 
 
33
  def __init__(self):
34
+ self.model_cache = {}
35
+ self.temp_cred_file = None
36
+ self._load_all_models()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
 
38
+ def _load_model(self, name: str):
39
+ if name in self.model_cache: return
 
40
  model_id = HF_MODELS.get(name)
41
+ if not model_id: return
 
42
 
43
  logging.info(f"Loading model '{name}' ({model_id}) to device '{DEVICE}'...")
44
  try:
 
46
  if name == "donut":
47
  processor = DonutProcessor.from_pretrained(model_id)
48
  model = VisionEncoderDecoderModel.from_pretrained(model_id, **quantization_config)
49
+ self.model_cache[name] = {"model": model, "processor": processor}
50
  elif name == "phi3":
51
+ model = pipeline("text-generation", model=model_id, torch_dtype=torch.bfloat16, trust_remote_code=True, **quantization_config)
52
+ self.model_cache[name] = {"model": model}
 
 
 
 
 
 
53
  logging.info(f"Model '{name}' loaded successfully.")
54
  except Exception as e:
55
  logging.error(f"Failed to load model '{name}': {e}", exc_info=True)
 
 
 
 
 
 
 
56
 
57
+ def _load_gemini_client(self):
58
+ if "gemini" in self.model_cache: return
59
  if creds_json_str := GOOGLE_APPLICATION_CREDENTIALS:
60
+ if not self.temp_cred_file or not os.path.exists(self.temp_cred_file):
61
  with tempfile.NamedTemporaryFile(mode="w", delete=False, suffix=".json") as tfp:
62
  tfp.write(creds_json_str)
63
+ self.temp_cred_file = tfp.name
64
+ os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = self.temp_cred_file
 
65
  try:
66
  genai.configure(api_key=GOOGLE_API_KEY)
67
+ self.model_cache["gemini"] = genai.GenerativeModel(GEMINI_MODEL_NAME)
68
  except Exception as e:
69
  logging.error(f"Gemini init failed: {e}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
 
71
+ def _load_all_models(self):
72
+ self._load_model("donut")
73
+ self._load_model("phi3")
74
+ self._load_gemini_client()
75
+
76
+ def _run_donut(self, image: Image.Image) -> Dict[str, Any]:
77
+ components = self.model_cache.get("donut")
78
+ if not components: return {"error": "Donut model not available."}
79
+ model, processor = components["model"].to(DEVICE), components["processor"]
80
+ task_prompt = "<s_cord-v2>"
81
+ decoder_input_ids = processor.tokenizer(task_prompt, add_special_tokens=False, return_tensors="pt").input_ids.to(DEVICE)
82
+ pixel_values = processor(image, return_tensors="pt").pixel_values.to(DEVICE)
83
+ outputs = model.generate(pixel_values, decoder_input_ids=decoder_input_ids, max_length=model.decoder.config.max_position_embeddings, early_stopping=True, use_cache=True, num_beams=1, bad_words_ids=[[processor.tokenizer.unk_token_id]], return_dict_in_generate=True)
84
+ sequence = processor.batch_decode(outputs.sequences)[0].replace(processor.tokenizer.eos_token, "").replace(processor.tokenizer.pad_token, "")
85
+ return processor.token2json(sequence)
86
+
87
+ def _run_phi3(self, medication_text: str) -> str:
88
+ components = self.model_cache.get("phi3")
89
+ if not components: return medication_text
90
+ pipe = components["model"]
91
+ prompt = f"Normalize the following prescription medication line into its components (drug, dosage, frequency). Raw text: '{medication_text}'"
92
+ outputs = pipe(prompt, max_new_tokens=100, do_sample=False)
93
+ return outputs[0]['generated_text'].split("Normalized:")[-1].strip()
94
+
95
+ def _run_gemini_resolver(self, image: Image.Image, donut_result: Dict, phi3_results: List[str]) -> Dict[str, Any]:
96
+ gemini_client = self.model_cache.get("gemini")
97
+ if not gemini_client: return {"error": "Gemini resolver not available."}
98
+ prompt = f"""
99
+ You are an expert pharmacist’s assistant...
100
+ (Your detailed prompt from the previous turn goes here)
101
+ ...
102
+ **Final JSON Schema**
103
+ ```json
104
+ {{
105
+ "Name": "string or null", "Date": "string (MM/DD/YYYY) or null", "Age": "string or null", "PhysicianName": "string or null",
106
+ "Medications": [{{"drug_raw": "string", "dosage": "string or null", "frequency": "string or null"}}]
107
+ }}
108
+ ```
109
+ """
110
+ try:
111
+ response = gemini_client.generate_content([prompt, image], generation_config={"response_mime_type": "application/json"})
112
+ return json.loads(response.text)
113
+ except Exception as e:
114
+ logging.error(f"Gemini resolver failed: {e}")
115
+ # This is where your original error was being generated from
116
+ return {"error": f"Gemini failed to resolve data: {e}"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
117
 
118
+ def process(self, image_path: str) -> Dict[str, Any]:
119
+ try:
120
+ image = Image.open(image_path).convert("RGB")
121
+ donut_data = self._run_donut(image)
122
+ med_lines = [item.get('text', '') for item in donut_data.get('menu', []) if 'medi' in item.get('category', '').lower()]
123
+ phi3_refined_meds = [self._run_phi3(line) for line in med_lines]
124
+ final_info = self._run_gemini_resolver(image, donut_data, phi3_refined_meds)
125
+ if final_info.get("error"): return final_info
126
+ return {"info": final_info, "error": None, "debug_info": {"donut_output": donut_data, "phi3_refinements": phi3_refined_meds}}
127
+ except Exception as e:
128
+ logging.error(f"Hybrid extraction pipeline failed: {e}", exc_info=True)
129
+ return {"error": f"An unexpected error occurred in the pipeline: {e}"}
130
 
131
+ @st.cache_resource
132
+ def get_processor():
133
+ return PrescriptionProcessor()
 
 
 
134
 
135
  def extract_prescription_info(image_path: str) -> Dict[str, Any]:
136
+ processor = get_processor()
137
+ return processor.process(image_path)