File size: 609 Bytes
0d253c0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
import pandas as pd

# Convert the raw Enron spam CSV into a two-column (label, text) CSV in which
# every message occupies a single line.


def _to_single_line(value):
    """Return *value* with every line break replaced by a single space.

    Non-string cells are returned unchanged so that unexpected dtypes
    (e.g. a numeric message body) pass through untouched.
    """
    if not isinstance(value, str):
        return value
    # Handle Windows (\r\n) first so it collapses to one space, then any
    # remaining bare carriage returns and line feeds.
    return value.replace('\r\n', ' ').replace('\r', ' ').replace('\n', ' ')


# Read the CSV file
df = pd.read_csv('enron_spam_data.csv')

# Build the cleaned frame with a non-mutating method chain. The original code
# modified a column subset of ``df`` in place (rename/dropna with
# ``inplace=True`` followed by a column assignment), which is the pattern that
# triggers pandas' SettingWithCopyWarning. Each step below returns a new
# DataFrame instead, so nothing derived from ``df`` is mutated.
df_filtered = (
    df[['Spam/Ham', 'Message']]                                    # keep only the needed columns
    .rename(columns={'Spam/Ham': 'label', 'Message': 'text'})      # rename the column headers
    .dropna(subset=['text'])                                       # drop rows with empty messages
    .assign(text=lambda frame: frame['text'].map(_to_single_line))  # flatten to a single line
)

# Save the filtered and modified DataFrame to a new CSV file
df_filtered.to_csv('enron_spam.csv', index=False)