import numpy as np
import pandas as pd

df = pd.read_json("data_set_50.json")

meme_attribute = {}
meme_filename = []
meme_list = []

for col in df.columns:
    name = df.loc["filename", col]
    name = name.replace(".jpg", "")
    name = name.replace("High-Quality-", "")
    attribute_tmp = df.loc["file_attributes", col]
    if attribute_tmp == {}:
        continue
    attribute_str = attribute_tmp['image_label'].strip().strip('"')
    cleaned_attribute = attribute_str.replace(',', '')
    file_name = df.loc["filename", col]
    meme_attribute[name] = cleaned_attribute
    meme_filename.append(file_name)
    meme_list.append(name)