import pandas as pd def preprocess(df,region_df): # filtering for summer olympics df = df[df['Season'] == 'Summer'] # merge with region_df df = df.merge(region_df, on='NOC', how='left') # dropping duplicates df.drop_duplicates(inplace=True) # one hot encoding medals df = pd.concat([df, pd.get_dummies(df['Medal'])], axis=1) return df