HarleDane's picture
Update app.py
4c9c809 verified
# Import the libraries
import joblib
from sklearn.datasets import fetch_openml
from sklearn.preprocessing import StandardScaler, OneHotEncoder
from sklearn.compose import make_column_transformer
from sklearn.pipeline import make_pipeline
from sklearn.model_selection import train_test_split, RandomizedSearchCV
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, classification_report
# Run the training script placed in the same directory as app.py
# The training script will train and persist a linear regression
# model with the filename 'model.joblib'
# Run training script
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
import joblib
# Choose and instantiate RandomForestRegressor model
model = RandomForestRegressor()
# Train the model using the training data
model.fit(X_train, y_train)
# Save the trained model to a file (e.g., 'insurance_model.joblib')
joblib.dump(model, 'model.joblib')
# Load the freshly trained model from disk
model = joblib.load('model.joblib')
# Prepare the logging functionality
log_file = Path("logs/") / f"data_{uuid.uuid4()}.json"
log_folder = log_file.parent
log_file.parent.mkdir(exist_ok=True)
#######################################################################################################################
scheduler = CommitScheduler(
repo_id="-----------", # provide a name "insurance-charge-mlops-logs" for the repo_id
repo_type="dataset",
folder_path=log_folder,
path_in_repo="data",
every=2
)
# Define the predict function which will take features, convert to dataframe and make predictions using the saved model
# the functions runs when 'Submit' is clicked or when a API request is made
import pandas as pd
import joblib
# Assuming 'model' is a trained model loaded using joblib.load()
def predict(age, sex, bmi, children, smoker, region):
"""Predicts insurance charges based on customer features.
Args:
age (int): Age of the customer.
sex (int): Gender of the customer (0 for female, 1 for male).
bmi (float): Body Mass Index of the customer.
children (int): Number of children the customer has.
smoker (int): Smoking status of the customer (0 for yes, 1 for no).
region (int): Region of the customer (1-4 representing different regions).
Returns:
float: Predicted insurance charges.
"""
# Create a DataFrame with the input features
input_data = pd.DataFrame({
'age': [age],
'sex': [sex],
'bmi': [bmi],
'children': [children],
'smoker': [smoker],
'region': [region]
})
# Make the prediction using the loaded model
prediction = model.predict(input_data)
# Return the prediction
return prediction[0]
# While the prediction is made, log both the inputs and outputs to a log file
# While writing to the log file, ensure that the commit scheduler is locked to avoid parallel
# access
with scheduler.lock:
with log_file.open("a") as f:
f.write(json.dumps(
{
'age': age,
'bmi': bmi,
'children': children,
'sex': sex,
'smoker': smoker,
'region': region,
'prediction': prediction[0]
}
))
f.write("\n")
return prediction[0]
# Set up UI components for input and output
import gradio as gr
age = gr.inputs.Slider(minimum=18, maximum=64, default=30, step=1, label="Age")
sex = gr.inputs.Radio(["female", "male"], type)
# Create the gradio interface, make title "HealthyLife Insurance Charge Prediction"
import gradio as gr
# ... (previous code for model training and predict function) ...
# Set up UI components for input and output
age = gr.inputs.Slider(minimum=18, maximum=64, default=30, step=1, label="Age")
sex = gr.inputs.Radio(["female", "male"], type="value", default="female", label="Sex") # Corrected type
bmi = gr.inputs.Number(default=25, label="BMI")
children = gr.inputs.Slider(minimum=0, maximum=5, default=0, step=1, label="Children")
smoker = gr.inputs.Radio(["yes", "no"], type="value", default="no", label="Smoker") # Corrected type
region = gr.inputs.Dropdown(["southwest", "southeast", "northwest", "northeast"], type="value", default="southwest", label="Region") # Corrected type
# Create the Gradio interface
demo = gr.Interface(
fn=predict,
inputs=[age, sex, bmi, children, smoker, region],
outputs="number",
title="HealthyLife Insurance Charge Prediction"
)
# Launch with a load balancer
demo.queue()
demo.launch(share=False)