Anonymous Authors
Update app.py
875e3fd
import gradio as gr
from datasets import load_from_disk
import numpy as np
import re
adjectives = ['ambitious', 'assertive', 'committed', 'compassionate', 'confident', 'considerate', 'decisive', 'determined', 'emotional', 'gentle',
'honest', 'intellectual', 'modest', 'no_adjective', 'outspoken', 'pleasant', 'self-confident', 'sensitive', 'stubborn', 'supportive', 'unreasonable']
professions = ['CEO', 'IT_specialist', 'accountant', 'aerospace_engineer', 'aide', 'air_conditioning_installer', 'architect', 'artist', 'author',
'baker', 'bartender', 'bus_driver', 'butcher', 'career_counselor', 'carpenter', 'carpet_installer', 'cashier', 'childcare_worker',
'civil_engineer', 'claims_appraiser', 'cleaner', 'clergy', 'clerk', 'coach', 'community_manager', 'compliance_officer', 'computer_programmer',
'computer_support_specialist', 'computer_systems_analyst', 'construction_worker', 'cook', 'correctional_officer', 'courier', 'credit_counselor',
'customer_service_representative', 'data_entry_keyer', 'dental_assistant', 'dental_hygienist', 'dentist', 'designer', 'detective', 'director',
'dishwasher', 'dispatcher', 'doctor', 'drywall_installer', 'electrical_engineer', 'electrician', 'engineer', 'event_planner', 'executive_assistant',
'facilities_manager', 'farmer', 'fast_food_worker', 'file_clerk', 'financial_advisor', 'financial_analyst', 'financial_manager', 'firefighter',
'fitness_instructor', 'graphic_designer', 'groundskeeper', 'hairdresser', 'head_cook', 'health_technician', 'host', 'hostess', 'industrial_engineer',
'insurance_agent', 'interior_designer', 'interviewer', 'inventory_clerk', 'jailer', 'janitor', 'laboratory_technician', 'language_pathologist',
'lawyer', 'librarian', 'logistician', 'machinery_mechanic', 'machinist', 'maid', 'manager', 'manicurist', 'market_research_analyst',
'marketing_manager', 'massage_therapist', 'mechanic', 'mechanical_engineer', 'medical_records_specialist', 'mental_health_counselor',
'metal_worker', 'mover', 'musician', 'network_administrator', 'nurse', 'nursing_assistant', 'nutritionist', 'occupational_therapist',
'office_clerk', 'office_worker', 'painter', 'paralegal', 'payroll_clerk', 'pharmacist', 'pharmacy_technician', 'photographer',
'physical_therapist', 'pilot', 'plane_mechanic', 'plumber', 'police_officer', 'postal_worker', 'printing_press_operator', 'producer',
'psychologist', 'public_relations_specialist', 'purchasing_agent', 'radiologic_technician', 'real_estate_broker', 'receptionist',
'repair_worker', 'roofer', 'sales_manager', 'salesperson', 'school_bus_driver', 'scientist', 'security_guard', 'sheet_metal_worker', 'singer',
'social_assistant', 'social_worker', 'software_developer', 'stocker', 'supervisor', 'taxi_driver', 'teacher', 'teaching_assistant', 'teller',
'therapist', 'tractor_operator', 'truck_driver', 'tutor', 'underwriter', 'veterinarian', 'waiter', 'waitress', 'welder', 'wholesale_buyer', 'writer']
models = ['DallE', 'SD_14', 'SD_2']
nos = [1,2,3,4,5,6,7,8,9,10]
ds = load_from_disk("jobs")
def get_nearest(adjective, profession, model, no):
index=768
df = ds.remove_columns(["image","image_path"]).to_pandas()
index = np.load(f"indexes/knn_{index}_65.npy")
ix = df.loc[(df['adjective'] == adjective) & (df['profession'] == profession) & (df['no'] == no) & (df['model'] == model)].index[0]
image = ds.select([index[ix][0]])["image"][0]
neighbors = ds.select(index[ix][1:25])
neighbor_images = neighbors["image"]
neighbor_captions = [caption.split("/")[-1] for caption in neighbors["image_path"]]
# neighbor_captions = [' '.join(caption.split("_")[4:-3]) for caption in neighbor_captions]
neighbor_models = neighbors["model"]
neighbor_captions = [f"{re.split('Photo_portrait_of_an?_', a)[-1]} {b}" for a,b in zip(neighbor_captions,neighbor_models)]
return image, list(zip(neighbor_images, neighbor_captions))
with gr.Blocks() as demo:
gr.Markdown("# BoVW Nearest Neighbors Explorer")
gr.Markdown("### TF-IDF index of the _identities_ dataset of images generated by 3 models using a visual vocabulary of 10,752 words.")
gr.Markdown("#### Choose one of the generated identity images to see its nearest neighbors according to a bag-of-visual-words model.")
gr.HTML("""<span style="color:red">⚠️ <b>DISCLAIMER: the images displayed by this tool were generated by text-to-image models and may depict offensive stereotypes or contain explicit content.</b></span>""")
with gr.Row():
with gr.Column():
model = gr.Radio(models, label="Model")
adjective = gr.Radio(adjectives, label="Adjective")
no = gr.Radio(nos, label="Image number")
with gr.Column():
profession = gr.Dropdown(professions, label="Profession")
button = gr.Button(value="Get nearest neighbors")
with gr.Row():
image = gr.Image()
gallery = gr.Gallery().style(grid=4)
button.click(get_nearest, inputs=[adjective, profession, model, no], outputs=[image, gallery])
demo.launch()