ranimeree commited on
Commit
1d8362d
·
verified ·
1 Parent(s): 9b1573b

update app.py using joblib.load

Browse files
Files changed (1) hide show
  1. app.py +62 -100
app.py CHANGED
@@ -1,115 +1,77 @@
1
  import gradio as gr
 
2
  import pandas as pd
 
3
  import numpy as np
4
  import pickle
5
- from sklearn.preprocessing import StandardScaler
6
- import sklearn
7
-
8
- print(f"Prediction environment scikit-learn version: {sklearn.__version__}")
9
-
10
- def preprocess_input(data_dict):
11
- """Preprocess input data to match the training format"""
12
- df = pd.DataFrame([data_dict])
13
-
14
- # Numeric features - add prefix 'num__'
15
- numeric_features = ['age', 'avg_glucose_level', 'bmi']
16
- for feat in numeric_features:
17
- df[f'num__{feat}'] = df[feat]
18
-
19
- # Scale numeric features
20
- scaler = StandardScaler()
21
- for feat in numeric_features:
22
- df[f'num__{feat}'] = scaler.fit_transform(df[[feat]])
23
-
24
- # Create categorical features with proper prefixes
25
- # gender
26
- df['cat__gender_Male'] = (df['gender'] == 'Male').astype(float)
27
- df['cat__gender_Other'] = 0.0 # Assuming no 'Other' gender in our interface
28
-
29
- # hypertension
30
- df['cat__hypertension_1'] = df['hypertension'].astype(float)
31
-
32
- # heart_disease
33
- df['cat__heart_disease_1'] = df['heart_disease'].astype(float)
34
-
35
- # ever_married
36
- df['cat__ever_married_Yes'] = (df['ever_married'] == 'Yes').astype(float)
37
-
38
- # work_type
39
- df['cat__work_type_Never_worked'] = (df['work_type'] == 'Never_worked').astype(float)
40
- df['cat__work_type_Private'] = (df['work_type'] == 'Private').astype(float)
41
- df['cat__work_type_Self-employed'] = (df['work_type'] == 'Self-employed').astype(float)
42
- df['cat__work_type_children'] = (df['work_type'] == 'children').astype(float)
43
-
44
- # Residence_type
45
- df['cat__Residence_type_Urban'] = (df['Residence_type'] == 'Urban').astype(float)
46
-
47
- # smoking_status
48
- df['cat__smoking_status_formerly smoked'] = (df['smoking_status'] == 'formerly smoked').astype(float)
49
- df['cat__smoking_status_never smoked'] = (df['smoking_status'] == 'never smoked').astype(float)
50
- df['cat__smoking_status_smokes'] = (df['smoking_status'] == 'smokes').astype(float)
51
-
52
- # Select only the transformed columns in the correct order
53
- expected_columns = [
54
- 'num__age', 'num__avg_glucose_level', 'num__bmi',
55
- 'cat__gender_Male', 'cat__gender_Other', 'cat__hypertension_1',
56
- 'cat__heart_disease_1', 'cat__ever_married_Yes',
57
- 'cat__work_type_Never_worked', 'cat__work_type_Private',
58
- 'cat__work_type_Self-employed', 'cat__work_type_children',
59
- 'cat__Residence_type_Urban', 'cat__smoking_status_formerly smoked',
60
- 'cat__smoking_status_never smoked', 'cat__smoking_status_smokes'
61
- ]
62
-
63
- return df[expected_columns]
64
-
65
- def predict(gender, age, hypertension, ever_married, work_type, heart_disease,
66
- avg_glucose_level, bmi, smoking_status, Residence_type):
67
- """Make prediction using the loaded model"""
68
- # Create input dictionary
69
- input_data = {
70
- 'gender': gender,
71
- 'age': age,
72
- 'hypertension': 1 if hypertension == 'Yes' else 0,
73
- 'heart_disease': 1 if heart_disease == 'Yes' else 0,
74
- 'ever_married': ever_married,
75
- 'work_type': work_type,
76
- 'Residence_type': Residence_type,
77
- 'avg_glucose_level': avg_glucose_level,
78
- 'bmi': bmi,
79
- 'smoking_status': smoking_status
80
- }
81
-
82
- # Preprocess the input
83
- processed_input = preprocess_input(input_data)
84
-
85
- # Load and use the model
86
- try:
87
- with open('model.pkl', 'rb') as file:
88
- model = pickle.load(file)
89
- prediction = model.predict_proba(processed_input)[0][1]
90
- return f"The probability of stroke is {prediction:.2%}"
91
- except Exception as e:
92
- return f"Error making prediction: {str(e)}"
93
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
94
  # Create the Gradio interface
95
  iface = gr.Interface(
96
  fn=predict,
97
  inputs=[
98
- gr.Radio(choices=['Female', 'Male'], label="Gender"),
99
- gr.Slider(minimum=0, maximum=100, label="Age"),
100
- gr.Radio(choices=['Yes', 'No'], label="Hypertension"),
101
- gr.Radio(choices=['Yes', 'No'], label="Ever Married"),
102
- gr.Radio(choices=['Private', 'Self-employed', 'Govt_job', 'children', 'Never_worked'], label="Work Type"),
103
- gr.Radio(choices=['Yes', 'No'], label="Heart Disease"),
104
- gr.Number(label="Average Glucose Level"),
105
- gr.Slider(minimum=10, maximum=50, label="BMI"),
106
- gr.Radio(choices=['formerly smoked', 'never smoked', 'smokes', 'Unknown'], label="Smoking Status"),
107
- gr.Radio(choices=['Urban', 'Rural'], label="Residence Type")
108
  ],
109
  outputs='text',
110
  title='Stroke Probability Predictor',
111
  description='Predicts the probability of having a stroke based on input features.'
112
  )
113
 
114
- if __name__ == "__main__":
115
- iface.launch()
 
1
  import gradio as gr
2
+ import dill
3
  import pandas as pd
4
+ import xgboost as xgb
5
  import numpy as np
6
  import pickle
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
 
8
+ import joblib
9
+
10
+ model = joblib.load('model.pkl')
11
+ print(model)
12
+
13
+
14
+
15
+ def predict(gender, age, hypertension, ever_married, work_type, heart_disease, avg_glucose_level, bmi, smoking_status, Residence_type):
16
+ # Mapping for categorical variables
17
+ gender_mapping = {'Male': 1, 'Female': 0}
18
+ hypertension_mapping = {'Yes': 1, 'No': 0}
19
+ ever_married_mapping = {'Yes': 1, 'No': 0}
20
+ work_type_mapping = {'Private': 2, 'Self-employed': 4, 'Govt_job': 3, 'children': 1, 'Never_worked': 0}
21
+ heart_disease_mapping = {'Yes': 1, 'No': 0}
22
+ smoking_status_mapping = {'formerly smoked': 3, 'smokes': 1, 'never smoked': 2, 'Unknown': 0}
23
+ Residence_type_mapping = {'Urban': 1, 'Rural': 0}
24
+
25
+ # Map categorical variables to their corresponding numerical values
26
+ gender = gender_mapping[gender]
27
+ hypertension = hypertension_mapping[hypertension]
28
+ ever_married = ever_married_mapping[ever_married]
29
+ work_type = work_type_mapping[work_type]
30
+ heart_disease = heart_disease_mapping[heart_disease]
31
+ smoking_status = smoking_status_mapping[smoking_status]
32
+ Residence_type = Residence_type_mapping[Residence_type]
33
+
34
+ inputs = [gender, age, hypertension, ever_married, work_type, heart_disease, avg_glucose_level, bmi, smoking_status, Residence_type]
35
+ input_labels = ['gender', 'age', 'hypertension', 'ever_married', 'work_type', 'heart_disease', 'avg_glucose_level', 'bmi', 'smoking_status', 'Residence_type']
36
+
37
+ # Convert the input into a pandas DataFrame
38
+ input_df = pd.DataFrame([inputs], columns=input_labels)
39
+
40
+ # Predict the stroke probability
41
+ prediction = model.predict_proba(input_df)[0][1]
42
+
43
+ # Return the prediction
44
+ result = "The probability of stroke is {:.2f}%".format(prediction * 100) # to give a percentage
45
+ return result
46
+
47
+
48
+
49
+
50
+
51
+
52
+ input_labels = [
53
+ 'gender', 'age', 'hypertension', 'ever_married', 'work_type',
54
+ 'heart_disease', 'avg_glucose_level', 'bmi', 'smoking_status', 'Residence_type'
55
+ ]
56
  # Create the Gradio interface
57
  iface = gr.Interface(
58
  fn=predict,
59
  inputs=[
60
+ gr.components.Radio(choices=['Female', 'Male'], label="Gender"),
61
+ gr.components.Slider(label="Age"),
62
+ gr.components.Radio(choices=['Yes', 'No'], label="Hypertension"),
63
+ gr.components.Radio(choices=['Yes', 'No'], label="Ever Married"),
64
+ gr.components.Radio(choices=['Private', 'Self-employed', 'Govt_job', 'children', 'Never_worked'], label="Work Type"),
65
+ gr.components.Radio(choices=['Yes', 'No'], label="Heart Disease"),
66
+ gr.components.Number(label="Average Glucose Level"),
67
+ gr.components.Slider(label="BMI"),
68
+ gr.components.Radio(choices=['formerly smoked', 'never smoked', 'smokes', 'Unknown'], label="Smoking Status"),
69
+ gr.components.Radio(choices=['Urban', 'Rural'], label="Residence Type")
70
  ],
71
  outputs='text',
72
  title='Stroke Probability Predictor',
73
  description='Predicts the probability of having a stroke based on input features.'
74
  )
75
 
76
+
77
+ iface.launch()