ranimeree commited on
Commit
bc355ae
·
verified ·
1 Parent(s): 4fac2c1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +156 -63
app.py CHANGED
@@ -1,78 +1,171 @@
1
  import gradio as gr
2
-
3
  import pandas as pd
4
-
5
  import numpy as np
6
  import pickle
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
 
8
- def decode_file(file_path):
9
- with open(file_path, 'rb') as file:
10
- obj = pickle.load(file)
11
- return obj
12
-
13
- model = decode_file('model.pkl')
14
-
15
-
16
- def predict(gender, age, hypertension, ever_married, work_type, heart_disease, avg_glucose_level, bmi, smoking_status, Residence_type):
17
- # Mapping for categorical variables
18
- gender_mapping = {'Male': 1, 'Female': 0}
19
- hypertension_mapping = {'Yes': 1, 'No': 0}
20
- ever_married_mapping = {'Yes': 1, 'No': 0}
21
- work_type_mapping = {'Private': 2, 'Self-employed': 4, 'Govt_job': 3, 'children': 1, 'Never_worked': 0}
22
- heart_disease_mapping = {'Yes': 1, 'No': 0}
23
- smoking_status_mapping = {'formerly smoked': 3, 'smokes': 1, 'never smoked': 2, 'Unknown': 0}
24
- Residence_type_mapping = {'Urban': 1, 'Rural': 0}
25
-
26
- # Map categorical variables to their corresponding numerical values
27
- gender = gender_mapping[gender]
28
- hypertension = hypertension_mapping[hypertension]
29
- ever_married = ever_married_mapping[ever_married]
30
- work_type = work_type_mapping[work_type]
31
- heart_disease = heart_disease_mapping[heart_disease]
32
- smoking_status = smoking_status_mapping[smoking_status]
33
- Residence_type = Residence_type_mapping[Residence_type]
34
-
35
- inputs = [gender, age, hypertension, ever_married, work_type, heart_disease, avg_glucose_level, bmi, smoking_status, Residence_type]
36
- input_labels = ['gender', 'age', 'hypertension', 'ever_married', 'work_type', 'heart_disease', 'avg_glucose_level', 'bmi', 'smoking_status', 'Residence_type']
37
-
38
- # Convert the input into a pandas DataFrame
39
- input_df = pd.DataFrame([inputs], columns=input_labels)
40
-
41
- # Predict the stroke probability
42
- prediction = model.predict_proba(input_df)[0][1]
43
-
44
- # Return the prediction
45
- result = "The probability of stroke is {:.2f}%".format(prediction * 100) # to give a percentage
46
- return result
47
-
48
-
49
-
50
-
51
-
52
-
53
- input_labels = [
54
- 'gender', 'age', 'hypertension', 'ever_married', 'work_type',
55
- 'heart_disease', 'avg_glucose_level', 'bmi', 'smoking_status', 'Residence_type'
56
- ]
57
  # Create the Gradio interface
58
  iface = gr.Interface(
59
  fn=predict,
60
  inputs=[
61
- gr.components.Radio(choices=['Female', 'Male'], label="Gender"),
62
- gr.components.Slider(label="Age"),
63
- gr.components.Radio(choices=['Yes', 'No'], label="Hypertension"),
64
- gr.components.Radio(choices=['Yes', 'No'], label="Ever Married"),
65
- gr.components.Radio(choices=['Private', 'Self-employed', 'Govt_job', 'children', 'Never_worked'], label="Work Type"),
66
- gr.components.Radio(choices=['Yes', 'No'], label="Heart Disease"),
67
- gr.components.Number(label="Average Glucose Level"),
68
- gr.components.Slider(label="BMI"),
69
- gr.components.Radio(choices=['formerly smoked', 'never smoked', 'smokes', 'Unknown'], label="Smoking Status"),
70
- gr.components.Radio(choices=['Urban', 'Rural'], label="Residence Type")
71
  ],
72
  outputs='text',
73
  title='Stroke Probability Predictor',
74
  description='Predicts the probability of having a stroke based on input features.'
75
  )
76
 
77
-
78
- iface.launch()
 
1
  import gradio as gr
 
2
  import pandas as pd
 
3
  import numpy as np
4
  import pickle
5
+ from sklearn.preprocessing import StandardScaler
6
+ import sklearn
7
+ import os
8
+
9
+ print(f"Prediction environment scikit-learn version: {sklearn.__version__}")
10
+
11
+ def load_model():
12
+ """Load the model with version compatibility check"""
13
+ possible_paths = [
14
+ "/content/Project/metadata/mlflow/mlartifacts/0951b451e9554321adaebc8f9f15ac8c/artifacts/train/model/artifacts/sk_model/model.pkl",
15
+ "model.pkl",
16
+ "/home/user/app/model.pkl",
17
+ "./model.pkl",
18
+ "../model.pkl"
19
+ ]
20
+
21
+ for path in possible_paths:
22
+ try:
23
+ if os.path.exists(path):
24
+ with open(path, 'rb') as f:
25
+ try:
26
+ model = pickle.load(f)
27
+ # Test if model can make predictions
28
+ dummy_data = pd.DataFrame({
29
+ 'num__age': [0],
30
+ 'num__avg_glucose_level': [0],
31
+ 'num__bmi': [0],
32
+ 'cat__gender_Male': [0],
33
+ 'cat__gender_Other': [0],
34
+ 'cat__hypertension_1': [0],
35
+ 'cat__heart_disease_1': [0],
36
+ 'cat__ever_married_Yes': [0],
37
+ 'cat__work_type_Never_worked': [0],
38
+ 'cat__work_type_Private': [0],
39
+ 'cat__work_type_Self-employed': [0],
40
+ 'cat__work_type_children': [0],
41
+ 'cat__Residence_type_Urban': [0],
42
+ 'cat__smoking_status_formerly smoked': [0],
43
+ 'cat__smoking_status_never smoked': [0],
44
+ 'cat__smoking_status_smokes': [0]
45
+ })
46
+ model.predict_proba(dummy_data)
47
+ print(f"Successfully loaded and tested model from {path}")
48
+ return model
49
+ except Exception as e:
50
+ print(f"Model loaded but failed testing from {path}: {e}")
51
+ continue
52
+ except Exception as e:
53
+ print(f"Failed to load from {path}: {e}")
54
+ continue
55
+
56
+ print("Could not load model from any location")
57
+ return None
58
+
59
+ # Load the model once when starting the app
60
+ model = load_model()
61
+
62
+ def preprocess_input(data_dict):
63
+ """Preprocess input data to match the training format"""
64
+ # First create DataFrame with original columns
65
+ df = pd.DataFrame([data_dict])
66
+
67
+ # Store original features before transformation
68
+ original_df = df.copy()
69
+
70
+ # Numeric features
71
+ numeric_features = ['age', 'avg_glucose_level', 'bmi']
72
+
73
+ # Scale numeric features and add prefix
74
+ scaler = StandardScaler()
75
+ scaled_features = scaler.fit_transform(df[numeric_features])
76
+ for i, feat in enumerate(numeric_features):
77
+ df[f'num__{feat}'] = scaled_features[:, i]
78
+
79
+ # Create categorical features
80
+ # Gender
81
+ df['cat__gender_Male'] = (df['gender'] == 'Male').astype(float)
82
+ df['cat__gender_Other'] = 0.0
83
+
84
+ # Hypertension
85
+ df['cat__hypertension_1'] = df['hypertension'].astype(float)
86
+
87
+ # Heart Disease
88
+ df['cat__heart_disease_1'] = df['heart_disease'].astype(float)
89
+
90
+ # Ever Married
91
+ df['cat__ever_married_Yes'] = (df['ever_married'] == 'Yes').astype(float)
92
+
93
+ # Work Type
94
+ df['cat__work_type_Never_worked'] = (df['work_type'] == 'Never_worked').astype(float)
95
+ df['cat__work_type_Private'] = (df['work_type'] == 'Private').astype(float)
96
+ df['cat__work_type_Self-employed'] = (df['work_type'] == 'Self-employed').astype(float)
97
+ df['cat__work_type_children'] = (df['work_type'] == 'children').astype(float)
98
+
99
+ # Residence Type
100
+ df['cat__Residence_type_Urban'] = (df['Residence_type'] == 'Urban').astype(float)
101
+
102
+ # Smoking Status
103
+ df['cat__smoking_status_formerly smoked'] = (df['smoking_status'] == 'formerly smoked').astype(float)
104
+ df['cat__smoking_status_never smoked'] = (df['smoking_status'] == 'never smoked').astype(float)
105
+ df['cat__smoking_status_smokes'] = (df['smoking_status'] == 'smokes').astype(float)
106
+
107
+ # Select only the transformed columns in the correct order
108
+ feature_columns = [
109
+ 'num__age', 'num__avg_glucose_level', 'num__bmi',
110
+ 'cat__gender_Male', 'cat__gender_Other', 'cat__hypertension_1',
111
+ 'cat__heart_disease_1', 'cat__ever_married_Yes',
112
+ 'cat__work_type_Never_worked', 'cat__work_type_Private',
113
+ 'cat__work_type_Self-employed', 'cat__work_type_children',
114
+ 'cat__Residence_type_Urban', 'cat__smoking_status_formerly smoked',
115
+ 'cat__smoking_status_never smoked', 'cat__smoking_status_smokes'
116
+ ]
117
+
118
+ return df[feature_columns]
119
+
120
+ def predict(gender, age, hypertension, ever_married, work_type, heart_disease,
121
+ avg_glucose_level, bmi, smoking_status, Residence_type):
122
+ """Make prediction using the loaded model"""
123
+ if model is None:
124
+ return "Error: Model not loaded"
125
+
126
+ # Create input dictionary
127
+ input_data = {
128
+ 'gender': gender,
129
+ 'age': float(age), # Ensure numeric
130
+ 'hypertension': 1 if hypertension == 'Yes' else 0,
131
+ 'heart_disease': 1 if heart_disease == 'Yes' else 0,
132
+ 'ever_married': ever_married,
133
+ 'work_type': work_type,
134
+ 'Residence_type': Residence_type,
135
+ 'avg_glucose_level': float(avg_glucose_level), # Ensure numeric
136
+ 'bmi': float(bmi), # Ensure numeric
137
+ 'smoking_status': smoking_status
138
+ }
139
+
140
+ # Preprocess the input
141
+ processed_input = preprocess_input(input_data)
142
+
143
+ # Use the loaded model
144
+ try:
145
+ prediction = model.predict_proba(processed_input)[0][1]
146
+ return f"The probability of stroke is {prediction:.2%}"
147
+ except Exception as e:
148
+ return f"Error making prediction: {str(e)}"
149
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
150
  # Create the Gradio interface
151
  iface = gr.Interface(
152
  fn=predict,
153
  inputs=[
154
+ gr.Radio(choices=['Female', 'Male'], label="Gender"),
155
+ gr.Slider(minimum=0, maximum=100, label="Age"),
156
+ gr.Radio(choices=['Yes', 'No'], label="Hypertension"),
157
+ gr.Radio(choices=['Yes', 'No'], label="Ever Married"),
158
+ gr.Radio(choices=['Private', 'Self-employed', 'Govt_job', 'children', 'Never_worked'], label="Work Type"),
159
+ gr.Radio(choices=['Yes', 'No'], label="Heart Disease"),
160
+ gr.Number(label="Average Glucose Level"),
161
+ gr.Slider(minimum=10, maximum=50, label="BMI"),
162
+ gr.Radio(choices=['formerly smoked', 'never smoked', 'smokes', 'Unknown'], label="Smoking Status"),
163
+ gr.Radio(choices=['Urban', 'Rural'], label="Residence Type")
164
  ],
165
  outputs='text',
166
  title='Stroke Probability Predictor',
167
  description='Predicts the probability of having a stroke based on input features.'
168
  )
169
 
170
+ if __name__ == "__main__":
171
+ iface.launch()