professions-bovw-knn

Runtime error

Anonymous Authors

Update app.py

875e3fd over 1 year ago

5.28 kB

	import gradio as gr
	from datasets import load_from_disk
	import numpy as np
	import re


	adjectives = ['ambitious', 'assertive', 'committed', 'compassionate', 'confident', 'considerate', 'decisive', 'determined', 'emotional', 'gentle',
	'honest', 'intellectual', 'modest', 'no_adjective', 'outspoken', 'pleasant', 'self-confident', 'sensitive', 'stubborn', 'supportive', 'unreasonable']

	professions = ['CEO', 'IT_specialist', 'accountant', 'aerospace_engineer', 'aide', 'air_conditioning_installer', 'architect', 'artist', 'author',
	'baker', 'bartender', 'bus_driver', 'butcher', 'career_counselor', 'carpenter', 'carpet_installer', 'cashier', 'childcare_worker',
	'civil_engineer', 'claims_appraiser', 'cleaner', 'clergy', 'clerk', 'coach', 'community_manager', 'compliance_officer', 'computer_programmer',
	'computer_support_specialist', 'computer_systems_analyst', 'construction_worker', 'cook', 'correctional_officer', 'courier', 'credit_counselor',
	'customer_service_representative', 'data_entry_keyer', 'dental_assistant', 'dental_hygienist', 'dentist', 'designer', 'detective', 'director',
	'dishwasher', 'dispatcher', 'doctor', 'drywall_installer', 'electrical_engineer', 'electrician', 'engineer', 'event_planner', 'executive_assistant',
	'facilities_manager', 'farmer', 'fast_food_worker', 'file_clerk', 'financial_advisor', 'financial_analyst', 'financial_manager', 'firefighter',
	'fitness_instructor', 'graphic_designer', 'groundskeeper', 'hairdresser', 'head_cook', 'health_technician', 'host', 'hostess', 'industrial_engineer',
	'insurance_agent', 'interior_designer', 'interviewer', 'inventory_clerk', 'jailer', 'janitor', 'laboratory_technician', 'language_pathologist',
	'lawyer', 'librarian', 'logistician', 'machinery_mechanic', 'machinist', 'maid', 'manager', 'manicurist', 'market_research_analyst',
	'marketing_manager', 'massage_therapist', 'mechanic', 'mechanical_engineer', 'medical_records_specialist', 'mental_health_counselor',
	'metal_worker', 'mover', 'musician', 'network_administrator', 'nurse', 'nursing_assistant', 'nutritionist', 'occupational_therapist',
	'office_clerk', 'office_worker', 'painter', 'paralegal', 'payroll_clerk', 'pharmacist', 'pharmacy_technician', 'photographer',
	'physical_therapist', 'pilot', 'plane_mechanic', 'plumber', 'police_officer', 'postal_worker', 'printing_press_operator', 'producer',
	'psychologist', 'public_relations_specialist', 'purchasing_agent', 'radiologic_technician', 'real_estate_broker', 'receptionist',
	'repair_worker', 'roofer', 'sales_manager', 'salesperson', 'school_bus_driver', 'scientist', 'security_guard', 'sheet_metal_worker', 'singer',
	'social_assistant', 'social_worker', 'software_developer', 'stocker', 'supervisor', 'taxi_driver', 'teacher', 'teaching_assistant', 'teller',
	'therapist', 'tractor_operator', 'truck_driver', 'tutor', 'underwriter', 'veterinarian', 'waiter', 'waitress', 'welder', 'wholesale_buyer', 'writer']
	models = ['DallE', 'SD_14', 'SD_2']
	nos = [1,2,3,4,5,6,7,8,9,10]

	ds = load_from_disk("jobs")

	def get_nearest(adjective, profession, model, no):
	index=768
	df = ds.remove_columns(["image","image_path"]).to_pandas()
	index = np.load(f"indexes/knn_{index}_65.npy")
	ix = df.loc[(df['adjective'] == adjective) & (df['profession'] == profession) & (df['no'] == no) & (df['model'] == model)].index[0]
	image = ds.select([index[ix][0]])["image"][0]
	neighbors = ds.select(index[ix][1:25])
	neighbor_images = neighbors["image"]
	neighbor_captions = [caption.split("/")[-1] for caption in neighbors["image_path"]]
	# neighbor_captions = [' '.join(caption.split("_")[4:-3]) for caption in neighbor_captions]
	neighbor_models = neighbors["model"]
	neighbor_captions = [f"{re.split('Photo_portrait_of_an?_', a)[-1]} {b}" for a,b in zip(neighbor_captions,neighbor_models)]
	return image, list(zip(neighbor_images, neighbor_captions))

	with gr.Blocks() as demo:
	gr.Markdown("# BoVW Nearest Neighbors Explorer")
	gr.Markdown("### TF-IDF index of the _identities_ dataset of images generated by 3 models using a visual vocabulary of 10,752 words.")
	gr.Markdown("#### Choose one of the generated identity images to see its nearest neighbors according to a bag-of-visual-words model.")
	gr.HTML("""<span style="color:red">⚠️ <b>DISCLAIMER: the images displayed by this tool were generated by text-to-image models and may depict offensive stereotypes or contain explicit content.</b></span>""")
	with gr.Row():
	with gr.Column():
	model = gr.Radio(models, label="Model")
	adjective = gr.Radio(adjectives, label="Adjective")
	no = gr.Radio(nos, label="Image number")
	with gr.Column():
	profession = gr.Dropdown(professions, label="Profession")
	button = gr.Button(value="Get nearest neighbors")
	with gr.Row():
	image = gr.Image()
	gallery = gr.Gallery().style(grid=4)
	button.click(get_nearest, inputs=[adjective, profession, model, no], outputs=[image, gallery])
	demo.launch()