beihai commited on
Commit
2ec0192
·
1 Parent(s): b967c55

Upload data.py

Browse files
Files changed (1) hide show
  1. data.py +71 -0
data.py ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pandas as pd
2
+ import numpy as np
3
+ from sklearn import preprocessing
4
+ import streamlit as st
5
+ import joblib
6
+
7
+
8
+ def getDataSetOrigin():
9
+ dataSet = [
10
+ ["青绿", "蜷缩", "浊响", "清晰", "凹陷", "硬滑", 1],
11
+ ["乌黑", "蜷缩", "沉闷", "清晰", "凹陷", "硬滑", 1],
12
+ ["乌黑", "蜷缩", "浊响", "清晰", "凹陷", "硬滑", 1],
13
+ ["青绿", "蜷缩", "沉闷", "清晰", "凹陷", "硬滑", 1],
14
+ ["浅白", "蜷缩", "浊响", "清晰", "凹陷", "硬滑", 1],
15
+ ["青绿", "稍蜷", "浊响", "清晰", "稍凹", "软粘", 1],
16
+ ["乌黑", "稍蜷", "浊响", "稍糊", "稍凹", "软粘", 1],
17
+ ["乌黑", "稍蜷", "浊响", "清晰", "稍凹", "硬滑", 1],
18
+ ["乌黑", "稍蜷", "沉闷", "稍糊", "稍凹", "硬滑", 0],
19
+ ["青绿", "硬挺", "清脆", "清晰", "平坦", "软粘", 0],
20
+ ["浅白", "硬挺", "清脆", "模糊", "平坦", "硬滑", 0],
21
+ ["浅白", "蜷缩", "浊响", "模糊", "平坦", "软粘", 0],
22
+ ["青绿", "稍蜷", "浊响", "稍糊", "凹陷", "硬滑", 0],
23
+ ["浅白", "稍蜷", "沉闷", "稍糊", "凹陷", "硬滑", 0],
24
+ ["乌黑", "稍蜷", "浊响", "清晰", "稍凹", "软粘", 0],
25
+ ["浅白", "蜷缩", "浊响", "模糊", "平坦", "硬滑", 0],
26
+ ["青绿", "蜷缩", "沉闷", "稍糊", "稍凹", "硬滑", 0],
27
+ ]
28
+ features = [
29
+ "color",
30
+ "root",
31
+ "knocks",
32
+ "texture",
33
+ "navel",
34
+ "touch",
35
+ "label",
36
+ ]
37
+ dataSet = np.array(dataSet)
38
+ dfOrigin = pd.DataFrame(dataSet, columns=features)
39
+ return dfOrigin
40
+
41
+
42
+ def dataPreprocessing():
43
+ df = getDataSetOrigin()
44
+ for feature in df.columns[0:6]:
45
+ le = preprocessing.LabelEncoder()
46
+ le = le.fit(df[feature])
47
+ df[feature] = le.transform(df[feature])
48
+ joblib.dump(le, "./models/" + feature + "_LabelEncoder.model")
49
+ df["label"] = df["label"].astype(int)
50
+
51
+ return df
52
+
53
+
54
+ def inputData():
55
+ st.sidebar.subheader("请选择西瓜外观:sunglasses:")
56
+ color = st.sidebar.selectbox("色泽", ("青绿", "乌黑", "浅白"))
57
+ root = st.sidebar.selectbox("根蒂", ("蜷缩", "稍蜷", "硬挺"))
58
+ knocks = st.sidebar.selectbox("敲击", ("浊响", "沉闷", "清脆"))
59
+ texture = st.sidebar.selectbox("纹理", ("清晰", "稍糊", "模糊"))
60
+ navel = st.sidebar.selectbox("脐部", ("凹陷", "稍凹", "平坦"))
61
+ touch = st.sidebar.selectbox("触感", ("硬滑", "软粘"))
62
+ input = [[color, root, knocks, texture, navel, touch]]
63
+ features = ["color", "root", "knocks", "texture", "navel", "touch"]
64
+ np.array(input).reshape(1, 6)
65
+ df_input = pd.DataFrame(input, columns=features, index=None)
66
+
67
+ for feature in features[0:6]:
68
+ le = joblib.load("./models/" + feature + "_LabelEncoder.model")
69
+ df_input[feature] = le.transform(df_input[feature])
70
+
71
+ return df_input