# File size: 16,144 Bytes

# 7a8bc6d

import streamlit as st
import torch
import numpy as np
import pickle
import json
from transformers import AutoTokenizer, AutoModel
import torch.nn as nn
import os

# Configure the Streamlit page: browser-tab title, tab icon, and wide layout.
# NOTE(review): Streamlit documents set_page_config as a call that should run
# before other Streamlit commands — keep it above any other st.* usage and
# confirm against the installed Streamlit version.
st.set_page_config(
    page_title="Drug Prediction and Polypharmacy System", 
    page_icon="💊",
    layout="wide"
)

# Model class definition - must match the training model architecture
class EnhancedMedicationModel(nn.Module):
    """Transformer encoder with a shared dense layer and three task heads.

    The encoder output at the first token position is passed through dropout
    and a shared dense layer, then fed to three independent heads:

    * ``medication_classifier``   - one logit per medication (multi-label)
    * ``polypharmacy_classifier`` - one logit per polypharmacy risk class
    * ``disease_classifier``      - one logit per disease class

    Attribute names and the layer order inside each head determine the
    ``state_dict`` keys, so they must stay in sync with the architecture the
    saved weights were trained with.

    Args:
        model_name: Identifier passed to ``AutoModel.from_pretrained``.
        num_medications: Output size of the medication head.
        num_polypharmacy_classes: Output size of the polypharmacy head.
        num_disease_classes: Output size of the disease head.
        dropout_rate: Dropout probability used after the encoder and inside
            every head.
    """

    def __init__(self, model_name, num_medications, num_polypharmacy_classes, num_disease_classes, dropout_rate=0.3):
        super().__init__()
        self.bert = AutoModel.from_pretrained(model_name)
        self.dropout = nn.Dropout(dropout_rate)
        hidden_size = self.bert.config.hidden_size

        # Common representation layer shared by all three heads
        self.common_dense = nn.Linear(hidden_size, hidden_size)

        # Task-specific heads; all share the same two-layer layout
        self.medication_classifier = self._build_head(hidden_size, num_medications, dropout_rate)
        self.polypharmacy_classifier = self._build_head(hidden_size, num_polypharmacy_classes, dropout_rate)
        self.disease_classifier = self._build_head(hidden_size, num_disease_classes, dropout_rate)

        # Apply weight initialization to the newly created (non-encoder) layers
        self._init_weights()

    @staticmethod
    def _build_head(hidden_size, num_outputs, dropout_rate):
        """Return a head of the form Linear -> ReLU -> Dropout -> Linear."""
        return nn.Sequential(
            nn.Linear(hidden_size, hidden_size // 2),
            nn.ReLU(),
            nn.Dropout(dropout_rate),
            nn.Linear(hidden_size // 2, num_outputs),
        )

    def _init_weights(self):
        """Xavier-initialise weights and zero biases of every non-encoder Linear.

        ``Module.modules()`` yields the module itself and all of its
        descendants, so the same loop handles both the ``nn.Sequential`` heads
        and the bare ``nn.Linear`` shared layer. Each layer's own bias is
        zeroed (the shared layer's bias was previously skipped because a stale
        loop variable was referenced).
        """
        for block in (self.medication_classifier, self.polypharmacy_classifier,
                      self.disease_classifier, self.common_dense):
            for layer in block.modules():
                if isinstance(layer, nn.Linear):
                    nn.init.xavier_normal_(layer.weight)
                    nn.init.zeros_(layer.bias)

    def forward(self, input_ids, attention_mask):
        """Run the encoder and all three heads.

        Args:
            input_ids: Token id tensor forwarded to the encoder
                (presumably shaped (batch, seq_len) — confirm with caller).
            attention_mask: Attention mask tensor forwarded to the encoder.

        Returns:
            Tuple ``(medication_logits, polypharmacy_logits, disease_logits)``
            of raw, un-activated head outputs.
        """
        outputs = self.bert(input_ids=input_ids, attention_mask=attention_mask)
        # Use the hidden state at the first token position (CLS token)
        pooled_output = outputs.last_hidden_state[:, 0, :]
        pooled_output = self.dropout(pooled_output)

        # Common representation
        common_features = torch.relu(self.common_dense(pooled_output))

        medication_logits = self.medication_classifier(common_features)
        polypharmacy_logits = self.polypharmacy_classifier(common_features)
        disease_logits = self.disease_classifier(common_features)

        return medication_logits, polypharmacy_logits, disease_logits

@st.cache_resource
def load_model_and_resources(model_dir='streamlit_model'):
    """Load the model, tokenizer, label encoders and lookup tables.

    The result is cached by ``st.cache_resource`` so the work is not repeated
    for every call with the same argument.

    Args:
        model_dir: Directory containing ``model_config.json``,
            ``model_state_dict.pt``, ``label_encoders.pkl`` and
            ``lookup_data.pkl``. Defaults to ``'streamlit_model'``, resolved
            relative to the current working directory.

    Returns:
        dict with keys ``'model'``, ``'tokenizer'``, ``'mlb'``, ``'le_risk'``,
        ``'le_disease'``, ``'lookup_data'`` and ``'device'``.

    Raises:
        OSError: If any of the expected files cannot be opened.
        KeyError: If the config or encoder file lacks an expected key.
    """
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    # Load model configuration
    config_path = os.path.join(model_dir, 'model_config.json')
    with open(config_path, 'r', encoding='utf-8') as f:
        model_config = json.load(f)

    # Initialize tokenizer for the same pretrained model the encoder uses
    model_name = model_config['model_name']
    tokenizer = AutoTokenizer.from_pretrained(model_name)

    # Create model architecture
    model = EnhancedMedicationModel(
        model_name=model_name,
        num_medications=model_config['num_medications'],
        num_polypharmacy_classes=model_config['num_polypharmacy_classes'],
        num_disease_classes=model_config['num_disease_classes'],
        dropout_rate=0.3
    )

    # Load trained weights onto the selected device and switch to inference
    # mode (eval() disables dropout).
    # NOTE(review): torch.load unpickles the file; consider weights_only=True
    # if the installed torch version supports it.
    weights_path = os.path.join(model_dir, 'model_state_dict.pt')
    model.load_state_dict(torch.load(weights_path, map_location=device))
    model = model.to(device)
    model.eval()

    # SECURITY: pickle.load executes arbitrary code embedded in the file.
    # Only ship .pkl files produced by a trusted training pipeline.
    with open(os.path.join(model_dir, 'label_encoders.pkl'), 'rb') as f:
        encoders = pickle.load(f)

    with open(os.path.join(model_dir, 'lookup_data.pkl'), 'rb') as f:
        lookup_data = pickle.load(f)

    return {
        'model': model,
        'tokenizer': tokenizer,
        'mlb': encoders['mlb'],
        'le_risk': encoders['le_risk'],
        'le_disease': encoders['le_disease'],
        'lookup_data': lookup_data,
        'device': device
    }

def predict_patient_health_profile(patient_data, resources, *, threshold=0.5,
                                   max_recommendations=3, top_k=5):
    """Predict disease, medications and polypharmacy risk for one patient.

    Args:
        patient_data: Mapping with keys ``'name'``, ``'age'``, ``'gender'``,
            ``'blood_group'``, ``'weight'``, ``'symptoms'`` and ``'severity'``.
        resources: Mapping with keys ``'model'``, ``'tokenizer'``, ``'mlb'``,
            ``'le_risk'``, ``'le_disease'``, ``'lookup_data'`` and
            ``'device'`` (the structure returned by the resource loader).
        threshold: Minimum sigmoid probability for a medication to be
            recommended.
        max_recommendations: Maximum number of recommended medications.
        top_k: Number of medications reported in
            ``'medication_probabilities'``.

    Returns:
        dict with the patient name, predicted disease with its causes and
        prevention text, recommended medications (most confident first),
        polypharmacy risk and recommendation, a personalized health tip, and
        the ``top_k`` medication probabilities.
    """
    model = resources['model']
    tokenizer = resources['tokenizer']
    mlb = resources['mlb']
    le_risk = resources['le_risk']
    le_disease = resources['le_disease']
    lookup_data = resources['lookup_data']
    device = resources['device']

    # Create text input; the wording must stay exactly as the model expects it
    text_input = (
        f"Patient age {patient_data['age']}, gender {patient_data['gender']}, "
        f"blood group {patient_data['blood_group']}, weight {patient_data['weight']}kg. "
        f"SYMPTOMS: {patient_data['symptoms']}. "
        f"SEVERITY: {patient_data['severity']}."
    )

    # Tokenize
    encoding = tokenizer(
        text_input,
        add_special_tokens=True,
        max_length=256,
        padding='max_length',
        truncation=True,
        return_tensors='pt'
    )

    # Move to device
    input_ids = encoding['input_ids'].to(device)
    attention_mask = encoding['attention_mask'].to(device)

    # Get predictions (single sample, so index 0 / .item() select that sample)
    with torch.no_grad():
        medication_logits, polypharmacy_logits, disease_logits = model(input_ids, attention_mask)
        medication_probs = torch.sigmoid(medication_logits)[0].cpu().numpy()
        risk_index = torch.argmax(polypharmacy_logits, dim=1).item()
        disease_index = torch.argmax(disease_logits, dim=1).item()

    # Convert predictions to human-readable format
    predicted_risk = le_risk.classes_[risk_index]
    predicted_disease = le_disease.classes_[disease_index]

    # Rank every medication by probability, highest first
    sorted_meds = sorted(
        zip(mlb.classes_, medication_probs),
        key=lambda pair: pair[1],
        reverse=True,
    )
    top_meds = sorted_meds[:top_k]

    # Recommend the most confident medications above the threshold. Ranking
    # first ensures a high-confidence medication is never dropped merely
    # because it sorts late in the label order.
    med_results = [
        {
            'medication': med,
            'dosage': 'Consult doctor',
            'frequency': 'Consult doctor',
            'instruction': 'Consult doctor',
            'duration': 'As prescribed',
            'confidence': float(prob)
        }
        for med, prob in sorted_meds
        if prob > threshold
    ][:max_recommendations]

    # Get disease information
    disease_causes = lookup_data['disease_causes_dict'].get(predicted_disease, "Unknown causes")
    disease_prevention = lookup_data['disease_prevention_dict'].get(predicted_disease, "Consult healthcare provider")

    # Get polypharmacy recommendation
    polypharmacy_recommendation = lookup_data['polypharmacy_recommendation_dict'].get(
        predicted_risk, "Consult healthcare provider"
    )

    # Get personalized health tip, keyed by (disease, age decade, gender)
    age_decade = (patient_data['age'] // 10) * 10
    health_tip_key = (predicted_disease, age_decade, patient_data['gender'])
    personalized_health_tip = lookup_data['health_tips_dict'].get(
        health_tip_key, "Maintain a balanced diet and regular exercise routine."
    )

    # Return comprehensive results
    return {
        'patient_name': patient_data['name'],
        'predicted_disease': predicted_disease,
        'disease_causes': disease_causes,
        'disease_prevention': disease_prevention,
        'medications': med_results,
        'polypharmacy_risk': predicted_risk,
        'polypharmacy_recommendation': polypharmacy_recommendation,
        'personalized_health_tips': personalized_health_tip,
        'medication_probabilities': {med: float(prob) for med, prob in top_meds}
    }

def _collect_patient_data():
    """Render the input form and return the patient record built from it."""
    col1, col2 = st.columns(2)

    # Patient information inputs
    with col1:
        st.subheader("Patient Information")
        name = st.text_input("Patient Name", value="John Doe")
        age = st.number_input("Age", min_value=1, max_value=120, value=45)
        gender = st.selectbox("Gender", options=["Male", "Female", "Other"])
        blood_group = st.selectbox("Blood Group", options=["A+", "A-", "B+", "B-", "AB+", "AB-", "O+", "O-"])
        weight = st.number_input("Weight (kg)", min_value=1.0, max_value=300.0, value=70.0, step=0.1)

    with col2:
        st.subheader("Symptoms Information")

        # Common symptoms options
        common_symptoms = [
            "Headache", "Fever", "Fatigue", "Nausea", "Cough",
            "Sore throat", "Shortness of breath", "Chest pain",
            "Dizziness", "Abdominal pain", "Vomiting", "Diarrhea",
            "Muscle ache", "Joint pain", "Rash", "Loss of appetite"
        ]

        # Copy the widget's return value so appending never touches
        # Streamlit's own list.
        selected_symptoms = list(st.multiselect(
            "Select Symptoms",
            options=common_symptoms,
            default=["Headache", "Fever", "Fatigue"]
        ))

        # Custom symptom input. Skip it when it repeats a selected symptom:
        # a repeated entry would create two identical severity widgets, which
        # Streamlit rejects as a duplicate widget.
        custom_symptom = st.text_input("Add other symptom (if not in list)").strip()
        if custom_symptom and custom_symptom not in selected_symptoms:
            selected_symptoms.append(custom_symptom)

        # Convert selected symptoms to string format as expected by the model
        symptoms = "; ".join(selected_symptoms)

        st.subheader("Symptom Severity")

        # Severity label -> numeric score sent to the model
        severity_levels = {
            "Very Mild": 1,
            "Mild": 2,
            "Moderate": 3,
            "Severe": 4,
            "Very Severe": 5
        }

        severity_dict = {}

        # Compact layout: alternate severity pickers between two columns
        if selected_symptoms:
            cols = st.columns(2)
            for i, symptom in enumerate(selected_symptoms):
                with cols[i % 2]:
                    severity_option = st.selectbox(
                        f"{symptom}",
                        options=list(severity_levels),
                        index=1,  # Default to "Mild"
                        key=f"severity_{symptom}"
                    )
                    severity_dict[symptom] = severity_levels[severity_option]

        # Convert severity dict to string format as expected by the model
        severity = "; ".join(f"{symptom}:{score}" for symptom, score in severity_dict.items())

    return {
        'name': name,
        'age': age,
        'gender': gender,
        'blood_group': blood_group,
        'weight': weight,
        'symptoms': symptoms,
        'severity': severity
    }


def _render_prediction(prediction):
    """Display a prediction result dict in three columns plus score bars."""
    st.subheader(f"🔍 Health Profile Analysis Results for {prediction['patient_name']}")

    col1, col2, col3 = st.columns([1, 1, 1])

    # Column 1: Disease information
    with col1:
        st.markdown("### 🦠 Disease Prediction")
        st.markdown(f"**Predicted Disease**: {prediction['predicted_disease']}")

        with st.expander("Disease Causes"):
            st.write(prediction['disease_causes'])

        with st.expander("Prevention Methods"):
            st.write(prediction['disease_prevention'])

    # Column 2: Medication recommendations
    with col2:
        st.markdown("### 💊 Medication Recommendations")
        if not prediction['medications']:
            st.info("No medication met the confidence threshold. Please consult a healthcare provider.")
        for position, med in enumerate(prediction['medications'], start=1):
            st.markdown(f"**{position}. {med['medication']}** (Confidence: {med['confidence']:.2f})")
            # Blank lines between items keep each bullet as its own paragraph
            med_details = "\n\n".join([
                f"- **Dosage:** {med['dosage']}",
                f"- **Frequency:** {med['frequency']}",
                f"- **Instructions:** {med['instruction']}",
                f"- **Duration:** {med['duration']}",
            ])
            st.markdown(med_details)
            st.divider()

    # Column 3: Risk assessment and health tips
    with col3:
        st.markdown("### ⚠️ Polypharmacy Assessment")
        # Any risk label other than "Low"/"Medium" is shown in red
        risk_color = {"Low": "green", "Medium": "orange"}.get(prediction['polypharmacy_risk'], "red")
        st.markdown(f"**Risk Level**: <span style='color:{risk_color};font-weight:bold;'>{prediction['polypharmacy_risk']}</span>",
                    unsafe_allow_html=True)
        st.markdown(f"**Recommendation**: {prediction['polypharmacy_recommendation']}")

        st.markdown("### 🌿 Personalized Health Tips")
        st.info(prediction['personalized_health_tips'])

    # Display medication probabilities as text with progress bars
    st.subheader("Medication Confidence Scores")
    for med_name, med_prob in prediction['medication_probabilities'].items():
        st.text(f"{med_name}: {med_prob:.2f}")
        # Clamp defensively: st.progress rejects floats outside [0.0, 1.0]
        st.progress(min(max(med_prob, 0.0), 1.0))


def main():
    """Run the Streamlit app: load resources, collect input, show results.

    Loading failures and prediction failures are reported separately so the
    "check your model files" hint only appears when loading actually failed.
    """
    # App title and description
    st.title("🏥 Drug Prediction and Polypharmacy System")
    st.markdown("Enter patient information to receive medication recommendations, disease prediction, and polypharmacy risk assessment.")

    # Load model and resources; without them nothing else can work
    try:
        with st.spinner("Loading medical model and resources..."):
            resources = load_model_and_resources()
    except Exception as e:
        st.error(f"An error occurred: {str(e)}")
        st.error("Please make sure all model files are correctly placed in the 'streamlit_model' directory")
        return

    patient_data = _collect_patient_data()

    # Submit button
    if not st.button("Generate Health Profile", type="primary"):
        return

    # A prediction without any symptom has no meaningful input
    if not patient_data['symptoms']:
        st.warning("Please select or enter at least one symptom before generating a health profile.")
        return

    try:
        with st.spinner("Analyzing patient data and generating health profile..."):
            prediction = predict_patient_health_profile(patient_data, resources)
            _render_prediction(prediction)
    except Exception as e:
        st.error(f"An error occurred: {str(e)}")

# Script entry point: build the UI only when this file is executed directly,
# not when it is imported as a module.
if __name__ == "__main__":
    main()