import numpy as np
import pandas as pd

# Load the annotation export. The loop below iterates over the columns and
# reads the "filename" and "file_attributes" rows of each one, so the JSON is
# expected to yield one column per record with those two row labels.
df = pd.read_json("data_set_50.json")

meme_attribute = {}  # cleaned name -> cleaned 'image_label' text
meme_filename = []   # original file names of the records that were kept
meme_list = []       # cleaned names, in the same order as meme_filename

for col, record in df.items():
    attributes = record["file_attributes"]

    # Skip records that carry no usable label: a missing value (not a dict),
    # an empty dict, or a dict without 'image_label'. Only the empty-dict
    # case was skipped before; the other two aborted the whole run.
    if not isinstance(attributes, dict):
        continue
    label = attributes.get("image_label")
    if label is None:
        continue

    # Read the file name once and derive the cleaned name from it by dropping
    # the ".jpg" and "High-Quality-" fragments.
    file_name = record["filename"]
    name = file_name.replace(".jpg", "").replace("High-Quality-", "")

    # Normalise the label: trim whitespace, then surrounding double quotes,
    # then remove every comma.
    meme_attribute[name] = label.strip().strip('"').replace(",", "")
    meme_filename.append(file_name)
    meme_list.append(name)