Upload 8 files
Browse files- CBT.csv +0 -0
- app.py +33 -0
- classfication auc.jpg +0 -0
- classfication auc.png +0 -0
- precision recall curve.png +0 -0
- predicted values.png +0 -0
- receiver operating character example.png +0 -0
- xgboost log error.png +0 -0
CBT.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
app.py
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import streamlit as st
|
| 2 |
+
import pandas as pd
|
| 3 |
+
import matplotlib.pyplot as plt
|
| 4 |
+
from sklearn.impute import SimpleImputer
|
| 5 |
+
from imblearn.over_sampling import SMOTE
|
| 6 |
+
from imblearn.under_sampling import RandomUnderSampler
|
| 7 |
+
import numpy as np
|
| 8 |
+
from sklearn.pipeline import Pipeline
|
| 9 |
+
from imblearn.pipeline import make_pipeline
|
| 10 |
+
import imblearn
|
| 11 |
+
import openpyxl
|
| 12 |
+
|
| 13 |
+
st.title('Huayra app')
|
| 14 |
+
|
| 15 |
+
# 读取 Excel 文件
|
| 16 |
+
df = pd.read_csv(r'D:/vscodeim/ML0517/CBT.csv')
|
| 17 |
+
df1 = df.drop('UserID',axis=1)
|
| 18 |
+
|
| 19 |
+
st.write("# <center><span style='font-size:24px'>Here is the DataFrame after cleaning</span></center>", unsafe_allow_html=True)
|
| 20 |
+
st.dataframe(df1)
|
| 21 |
+
|
| 22 |
+
st.image('D:/vscodeim/ML0517/xgboost log error.png')
|
| 23 |
+
st.image('D:/vscodeim/ML0517/classfication auc.png')
|
| 24 |
+
|
| 25 |
+
st.write("Higher AUC values indicate that the model performs better in distinguishing between positive and negative samples.")
|
| 26 |
+
st.write("We get an AUC of **1** for the training set and **0.9985630707839712** for the test set. This indicates that the model performs very well.")
|
| 27 |
+
st.image('D:/vscodeim/ML0517/precision recall curve.png')
|
| 28 |
+
st.image('D:/vscodeim/ML0517/receiver operating character example.png')
|
| 29 |
+
|
| 30 |
+
st.write("The P-R Curve (Precision-Recall Curve) is a curve used to evaluate the performance of a binary classification model, which shows the precision of the model under different recall rates.")
|
| 31 |
+
|
| 32 |
+
st.write("Ideally, the P-R curve should be as close to the upper right as possible, which means that the model maintains a high precision at high recall.")
|
| 33 |
+
st.image('D:/vscodeim/ML0517/predicted values.png')
|
classfication auc.jpg
ADDED
|
classfication auc.png
ADDED
|
precision recall curve.png
ADDED
|
predicted values.png
ADDED
|
receiver operating character example.png
ADDED
|
xgboost log error.png
ADDED
|