Spaces:

shorthillstech
/

pybanking_value_prediction

Runtime error

App Files Files Community

pybanking_value_prediction / app.py

nikhil0nk

cleaning

bb0b18d over 3 years ago

raw

history blame contribute delete

3.45 kB

	import streamlit as st
	import streamlit.components.v1 as components
	import pandas as pd
	import pickle
	import matplotlib.pyplot as plt
	import pybanking
	from pybanking.value_prediction import model_value_prediction
	from pybanking.EDA import data_analysis
	import sklearn.metrics as metrics
	from mlxtend.plotting import plot_confusion_matrix
	import streamlit.components.v1 as components
	from sklearn.model_selection import train_test_split
	from PIL import Image
	from pycaret.regression import pull,predict_model


	# Page header: wide layout with the company logo in a narrow left column
	# and the app title in a right column twice as wide.
	st.set_page_config(page_title="Customer Value Prediction Model", layout="wide")

	logo_col, title_col = st.columns([1, 2])

	with logo_col:
	    st.image(Image.open('Shorthills.png'))

	with title_col:
	    st.title('Customer Value Prediction Model')

	# Default to the data returned by get_data() (the 'Sample Dataset' choice);
	# it is only replaced when the user actually uploads a file below.
	train_df = model_value_prediction.get_data()

	option2 = st.selectbox(
	    'Which dataset would you like to use for prediction?',
	    ['Sample Dataset', 'Upload Custom'],
	)

	if option2 == 'Upload Custom':
	    uploaded_file = st.file_uploader("Choose a file")
	    if uploaded_file is None:
	        # Nothing uploaded yet: keep the default data and prompt the user.
	        st.warning("you need to upload a csv file.")
	    else:
	        # Parse the uploaded file as CSV.
	        train_df = pd.read_csv(uploaded_file)

	# Preview the first five rows of whichever dataset is in effect.
	st.subheader('This is the Selected Data')
	st.dataframe(train_df.head(5))

	def _embed_html_report(report_path):
	    """Read the HTML report at *report_path* and render it in an expander.

	    The file is opened with a context manager so the handle is closed as
	    soon as the markup has been read; Streamlit re-runs this script on
	    every interaction, so an unclosed handle would leak on each rerun.
	    """
	    with open(report_path, 'r', encoding='utf-8') as report_file:
	        source_code = report_file.read()
	    with st.expander("See Report"):
	        components.html(source_code, height=600, scrolling=True)


	analysis_class = data_analysis.Analysis()

	option3 = st.selectbox(
	    'Select Exploratory Data Analysis type',
	    ['None', 'DataPrep', 'SweetViz', 'PandasProfiling'],
	)

	# Each backend writes its report to an HTML file in the working directory,
	# which is then embedded in the page. 'None' skips the analysis entirely.
	if option3 == 'SweetViz':
	    res = analysis_class.sweetviz_analysis(train_df)
	    # NOTE(review): open_browser=True presumably also tries to open the
	    # report in a browser on the machine running the app, which is not
	    # useful on a hosted server -- confirm whether this should be False.
	    res.show_html(filepath='SweetViz.html', open_browser=True, layout='widescreen', scale=None)
	    _embed_html_report('SweetViz.html')

	elif option3 == 'DataPrep':
	    res = analysis_class.dataprep_analysis(train_df)
	    res.save('DataPrep.html')
	    _embed_html_report('DataPrep.html')

	elif option3 == 'PandasProfiling':
	    res = analysis_class.pandas_analysis(train_df)
	    res.to_file("PandasProfiling.html")
	    _embed_html_report('PandasProfiling.html')

	# Model identifiers offered to the user. The selected name is passed to the
	# pybanking helpers and is also the stem of the pickle file loaded below.
	model_names = [
	    "Logistic_Regression",
	    "Support_Vector_Machine",
	    "Support_Vector_Machine_Optimized",
	    "Decision_Tree",
	    "Neural_Network",
	    "Random_Forest",
	    "Pycaret_Best",
	    "LGBM",
	    "Lasso",
	]

	option = st.selectbox(
	    'Select a model to be used',
	    model_names,
	)

	tr_df = model_value_prediction.important_feat(train_df, option)

	# SECURITY: pickle.load can execute arbitrary code embedded in the file.
	# The file name comes from the fixed list above, so only '<name>.pkl'
	# files in the working directory are read; keep those files trusted.
	# The context manager closes the handle, which the original left open.
	# NOTE(review): `model` is reassigned by the train() call further down the
	# script, so this loaded object appears unused -- confirm which is intended.
	with open(option + '.pkl', 'rb') as model_file:
	    model = pickle.load(model_file)

	st.write("Model Loaded : ", option)

	# Split/prepare the selected features. Only test_X and test_y are used
	# below; the remaining splits are unpacked to match the 8-tuple returned.
	train_X, test_X, train_y, dev_X, val_X, dev_y, val_y, test_y = (
	    model_value_prediction.preprocess_inputs(tr_df, option)
	)

	# Fit the chosen model and predict on the held-out test features.
	model = model_value_prediction.train(tr_df, option)
	y_pred = model_value_prediction.predict(test_X, model, option)

	if option == "Pycaret_Best":
	    # PyCaret path: predict_model() is run and the RMSLE is read from the
	    # table returned by pull() (presumably the metrics grid that
	    # predict_model just produced -- confirm against the PyCaret docs).
	    predict_model(model)
	    st.write("RMSLE Score:", pull()['RMSLE'][0])
	else:
	    # Take the square root of the MSLE explicitly instead of passing
	    # squared=False: that keyword is deprecated and later removed in newer
	    # scikit-learn releases, while this form works on every version.
	    # (Assumes a single-output target, where both forms agree.)
	    rmsle = metrics.mean_squared_log_error(test_y, y_pred) ** 0.5
	    st.write("RMSLE Score:", rmsle)
	    # power=1 selects the Poisson deviance that the label promises; the
	    # default power=0 is plain mean squared error. Poisson deviance
	    # requires non-negative targets and strictly positive predictions.
	    st.write("Poisson Score:", metrics.mean_tweedie_deviance(test_y, y_pred, power=1))