Spaces:

vamcrizer
/

memegen

Sleeping

memegen / preprocess.py

vam

Upload preprocess.py

9e7ea31 verified about 2 months ago

685 Bytes

	import numpy as np
	import pandas as pd

	# Load the annotation export. The lookups below treat "filename" and
	# "file_attributes" as row labels and visit every column in turn
	# (presumably one column per annotated image -- confirm against the JSON).
	df = pd.read_json("/kaggle/input/50memejson/data_set_50.json")

	meme_attribute = {}  # cleaned name -> cleaned image label
	meme_filename = []   # original filenames of the labelled entries, in column order
	meme_list = []       # cleaned names, index-aligned with meme_filename

	for col in df.columns:
	    # Read the filename once; it is both stored as-is and used to derive the key.
	    file_name = df.loc["filename", col]
	    attributes = df.loc["file_attributes", col]

	    # Skip entries that carry no usable label: an empty dict, a non-dict
	    # cell (e.g. a NaN placeholder for an absent field), or a dict without
	    # an "image_label" key. Indexing any of these would raise instead.
	    if not isinstance(attributes, dict) or "image_label" not in attributes:
	        continue

	    # Derive the lookup key by removing the ".jpg" and "High-Quality-"
	    # substrings from the filename.
	    name = file_name.replace(".jpg", "").replace("High-Quality-", "")

	    # Trim surrounding whitespace, then surrounding double quotes, and
	    # finally drop every comma from the label text.
	    label = attributes["image_label"].strip().strip('"')
	    cleaned_attribute = label.replace(",", "")

	    meme_attribute[name] = cleaned_attribute
	    meme_filename.append(file_name)
	    meme_list.append(name)