Olympic_data_analysis / preprocessor.py
Prathamesh1420's picture
Upload 7 files
8b2b7fb verified
raw
history blame contribute delete
382 Bytes
import pandas as pd
def preprocess(df: pd.DataFrame, region_df: pd.DataFrame) -> pd.DataFrame:
    """Build the Summer-only, region-annotated frame with medal indicators.

    Steps, in order:
      1. keep only rows whose ``Season`` equals ``'Summer'``;
      2. left-merge ``region_df`` on the ``NOC`` column;
      3. drop fully duplicated rows;
      4. append one 0/1 integer indicator column per medal value.

    Args:
        df: Frame with at least ``Season``, ``NOC`` and ``Medal`` columns.
        region_df: Lookup frame with a ``NOC`` column; its remaining columns
            are attached to each matching row.

    Returns:
        A new DataFrame; neither input is modified. ``Bronze``, ``Gold`` and
        ``Silver`` indicator columns are always present, all-zero when the
        corresponding medal does not occur in the data.

    Raises:
        KeyError: If ``Season``, ``NOC`` or ``Medal`` is missing.
    """
    # Filter to the Summer games only.
    summer = df[df['Season'] == 'Summer']

    # Left join keeps every row even when its NOC has no entry in region_df.
    merged = summer.merge(region_df, on='NOC', how='left')

    # Reassign instead of inplace=True: same result, no hidden mutation.
    merged = merged.drop_duplicates()

    # One-hot encode medals as integers. Without an explicit dtype, pandas
    # >= 2.0 yields booleans, and bool + bool is a logical OR rather than a
    # count, which breaks row-wise medal totals.
    medal_flags = pd.get_dummies(merged['Medal'], dtype=int)

    # Keep the output schema stable: a subset (or an empty frame) that lacks
    # one of the medal values would otherwise be missing that column.
    for medal in ('Bronze', 'Gold', 'Silver'):
        if medal not in medal_flags.columns:
            medal_flags[medal] = 0

    return pd.concat([merged, medal_flags], axis=1)