SandyTheAdventurer committed on
Commit
53d0197
·
verified ·
1 Parent(s): 2946656

Changed EDA graphs

Browse files
Files changed (1) hide show
  1. main.py +10 -2
main.py CHANGED
@@ -23,7 +23,7 @@ dataset.drop(columns=['customerID'], inplace=True)
23
  # Encoding categorical variables and Scaling numerical variables
24
  encoder = LabelEncoder()
25
  scaler = StandardScaler()
26
- for column in dataset.select_dtypes(include=['int64', 'float64']).columns:
27
  dataset[column] = scaler.fit_transform(dataset[column].values.reshape(-1, 1))
28
  for column in dataset.select_dtypes(include=['object']).columns:
29
  dataset[column] = encoder.fit_transform(dataset[column])
@@ -45,7 +45,15 @@ plt.savefig("graphs/EDAGraphs/Heatmap.png")
45
 
46
  for column in dataset.columns:
47
  fig, ax = plt.subplots(figsize=(16, 10))
48
- sns.kdeplot(dataset[column],ax=ax)
 
 
 
 
 
 
 
 
49
  plt.savefig(f"graphs/EDAGraphs/{column}.png")
50
 
51
  # Splitting the dataset into training and testing sets
 
23
  # Encoding categorical variables and Scaling numerical variables
24
  encoder = LabelEncoder()
25
  scaler = StandardScaler()
26
+ for column in dataset.select_dtypes(include=['int64', 'float64']).columns.drop("SeniorCitizen"):
27
  dataset[column] = scaler.fit_transform(dataset[column].values.reshape(-1, 1))
28
  for column in dataset.select_dtypes(include=['object']).columns:
29
  dataset[column] = encoder.fit_transform(dataset[column])
 
45
 
46
  for column in dataset.columns:
47
  fig, ax = plt.subplots(figsize=(16, 10))
48
+ if column == "Churn":
49
+ sns.kdeplot(x="Churn", data=dataset)
50
+ plt.savefig(f"graphs/EDAGraphs/{column}.png")
51
+ continue
52
+ if column == "MonthlyCharges":
53
+ sns.violinplot(x="Churn", y=column, data=dataset)
54
+ plt.savefig(f"graphs/EDAGraphs/{column}.png")
55
+ continue
56
+ sns.barplot(x=column, y="Churn", data=dataset ,ax=ax)
57
  plt.savefig(f"graphs/EDAGraphs/{column}.png")
58
 
59
  # Splitting the dataset into training and testing sets