Attend-and-Excite

Sleeping

App Files Files Community

Attend-and-Excite / app.py

hysts HF staff

Use gr.on

eaf1941 about 1 year ago

raw

history blame

8.61 kB

	#!/usr/bin/env python

	from __future__ import annotations

	import os
	import random

	import gradio as gr
	import numpy as np
	import PIL.Image
	import spaces
	import torch
	from diffusers import StableDiffusionAttendAndExcitePipeline, StableDiffusionPipeline

	# Markdown shown at the top of the demo page (rendered via gr.Markdown).
	DESCRIPTION = """\
	# Attend-and-Excite

	This is a demo for [Attend-and-Excite](https://arxiv.org/abs/2301.13826).
	Attend-and-Excite performs attention-based generative semantic guidance to mitigate subject neglect in Stable Diffusion.
	Select a prompt and a set of indices matching the subjects you wish to strengthen (the `Check token indices` cell can help map between a word and its index).
	"""

	# The pipelines are only loaded when CUDA is present, so tell visitors up
	# front when the app was started on a CPU-only machine.
	DESCRIPTION += (
	    "" if torch.cuda.is_available() else "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
	)

	# Load both pipelines only when a GPU is available; on CPU these names stay
	# undefined (the page description warns that the demo does not work there).
	if torch.cuda.is_available():
	    # Inside this guard CUDA is known to be available, so the device is
	    # always the first GPU.
	    device = torch.device("cuda:0")
	    model_id = "CompVis/stable-diffusion-v1-4"
	    # Attend-and-Excite pipeline and the plain Stable Diffusion baseline are
	    # built from the same checkpoint so their outputs can be compared.
	    ax_pipe = StableDiffusionAttendAndExcitePipeline.from_pretrained(model_id)
	    ax_pipe.to(device)
	    sd_pipe = StableDiffusionPipeline.from_pretrained(model_id)
	    sd_pipe.to(device)


	# Largest seed the UI offers: the maximum value of a signed 32-bit integer.
	MAX_SEED = np.iinfo(np.int32).max
	# Upper bound for the number of denoising steps a single request may use.
	MAX_INFERENCE_STEPS = 100


	def randomize_seed_fn(seed: int, randomize_seed: bool) -> int:
	    """Return the seed to use for the next generation.

	    Args:
	        seed: Seed currently selected by the caller.
	        randomize_seed: When true, ignore ``seed`` and draw a new one.

	    Returns:
	        ``seed`` unchanged, or a random integer in ``[0, MAX_SEED]`` when
	        ``randomize_seed`` is true.
	    """
	    return random.randint(0, MAX_SEED) if randomize_seed else seed


	def get_token_table(prompt: str) -> list[tuple[int, str]]:
	    """Map each token of ``prompt`` to the index used for Attend-and-Excite.

	    The prompt is tokenized with the Attend-and-Excite pipeline's tokenizer.
	    The first and last ids are dropped (presumably the tokenizer's start/end
	    markers -- confirm against the tokenizer) and the rest are numbered
	    from 1.

	    Args:
	        prompt: Text prompt to tokenize.

	    Returns:
	        A list of ``(index, decoded_token)`` pairs, indices starting at 1.
	    """
	    tokenizer = ax_pipe.tokenizer
	    inner_ids = tokenizer(prompt)["input_ids"][1:-1]
	    return [(position, tokenizer.decode(token_id)) for position, token_id in enumerate(inner_ids, start=1)]


	@spaces.GPU
	def run(
	    prompt: str,
	    indices_to_alter_str: str,
	    seed: int = 0,
	    apply_attend_and_excite: bool = True,
	    num_inference_steps: int = 50,
	    guidance_scale: float = 7.5,
	    scale_factor: int = 20,
	    thresholds: dict[int, float] | None = None,
	    max_iter_to_alter: int = 25,
	) -> PIL.Image.Image:
	    """Generate one image, with or without Attend-and-Excite guidance.

	    Args:
	        prompt: Text prompt passed to the pipeline.
	        indices_to_alter_str: Comma-separated token indices (e.g. ``"2,6"``).
	            Only parsed when ``apply_attend_and_excite`` is true.
	        seed: Seed for the torch generator created on the module's device.
	        apply_attend_and_excite: Use the Attend-and-Excite pipeline when
	            true, the plain Stable Diffusion pipeline otherwise.
	        num_inference_steps: Number of inference steps; must not exceed
	            ``MAX_INFERENCE_STEPS``.
	        guidance_scale: Guidance scale forwarded to the selected pipeline.
	        scale_factor: Forwarded unchanged to the Attend-and-Excite pipeline.
	        thresholds: Forwarded unchanged to the Attend-and-Excite pipeline.
	            ``None`` (the default) means ``{10: 0.5, 20: 0.8}``.
	        max_iter_to_alter: Forwarded unchanged to the Attend-and-Excite
	            pipeline.

	    Returns:
	        The first image produced by the selected pipeline.

	    Raises:
	        gr.Error: If ``num_inference_steps`` exceeds ``MAX_INFERENCE_STEPS``.
	        ValueError: If ``indices_to_alter_str`` cannot be parsed as a
	            comma-separated list of integers.
	    """
	    if num_inference_steps > MAX_INFERENCE_STEPS:
	        raise gr.Error(f"Number of steps cannot exceed {MAX_INFERENCE_STEPS}.")

	    # Build the default per call so no dict object is shared between calls
	    # (a dict literal in the signature would be a single shared instance).
	    if thresholds is None:
	        thresholds = {10: 0.5, 20: 0.8}

	    generator = torch.Generator(device=device).manual_seed(seed)

	    if not apply_attend_and_excite:
	        # Baseline: plain Stable Diffusion with the same seed and settings.
	        out = sd_pipe(
	            prompt=prompt,
	            guidance_scale=guidance_scale,
	            generator=generator,
	            num_inference_steps=num_inference_steps,
	        )
	        return out.images[0]

	    try:
	        token_indices = [int(item) for item in indices_to_alter_str.split(",")]
	    except (AttributeError, TypeError, ValueError) as err:
	        # Keep the original exception type and message, but preserve the
	        # underlying cause for debugging.
	        raise ValueError("Invalid token indices.") from err

	    out = ax_pipe(
	        prompt=prompt,
	        token_indices=token_indices,
	        guidance_scale=guidance_scale,
	        generator=generator,
	        num_inference_steps=num_inference_steps,
	        max_iter_to_alter=max_iter_to_alter,
	        thresholds=thresholds,
	        scale_factor=scale_factor,
	    )
	    return out.images[0]


	def process_example(
	    prompt: str,
	    indices_to_alter_str: str,
	    seed: int,
	    apply_attend_and_excite: bool,
	) -> tuple[list[tuple[int, str]], PIL.Image.Image]:
	    """Produce both outputs shown for a gallery example.

	    Args:
	        prompt: Example prompt.
	        indices_to_alter_str: Comma-separated token indices for the example.
	        seed: Fixed seed for the example.
	        apply_attend_and_excite: Whether the example uses Attend-and-Excite.

	    Returns:
	        A ``(token_table, image)`` pair: the token table for ``prompt`` and
	        the image generated by ``run`` with its remaining defaults.
	    """
	    # Tuple elements are evaluated left to right, so the token table is
	    # computed before the image is generated.
	    return (
	        get_token_table(prompt),
	        run(
	            prompt=prompt,
	            indices_to_alter_str=indices_to_alter_str,
	            seed=seed,
	            apply_attend_and_excite=apply_attend_and_excite,
	        ),
	    )


	# NOTE(review): the nesting below was reconstructed from the context-manager
	# structure of a flattened source -- confirm the accordion/column contents.
	with gr.Blocks(css="style.css") as demo:
	    gr.Markdown(DESCRIPTION)
	    gr.DuplicateButton(
	        value="Duplicate Space for private use",
	        elem_id="duplicate-button",
	        visible=os.getenv("SHOW_DUPLICATE_BUTTON") == "1",
	    )

	    with gr.Row():
	        # Input controls.
	        with gr.Column():
	            prompt = gr.Text(
	                label="Prompt",
	                max_lines=1,
	                placeholder="A pod of dolphins leaping out of the water in an ocean with a ship on the background",
	            )
	            with gr.Accordion(label="Check token indices", open=False):
	                show_token_indices_button = gr.Button("Show token indices")
	                token_indices_table = gr.Dataframe(
	                    label="Token indices",
	                    headers=["Index", "Token"],
	                    col_count=2,
	                )
	            token_indices_str = gr.Text(
	                label="Token indices (a comma-separated list indices of the tokens you wish to alter)",
	                max_lines=1,
	                placeholder="4,16",
	            )
	            apply_attend_and_excite = gr.Checkbox(label="Apply Attend-and-Excite", value=True)
	            seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
	            randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
	            num_inference_steps = gr.Slider(
	                label="Number of inference steps",
	                minimum=1,
	                maximum=MAX_INFERENCE_STEPS,
	                step=1,
	                value=50,
	            )
	            guidance_scale = gr.Slider(label="Guidance scale", minimum=0, maximum=50, step=0.1, value=7.5)
	            run_button = gr.Button("Generate")
	        # Generated image.
	        with gr.Column():
	            result = gr.Image(label="Result")

	    with gr.Row():
	        # Each (prompt, token indices, seed) case is listed twice in the
	        # gallery: first with Attend-and-Excite enabled, then disabled.
	        _example_cases = [
	            ("A mouse and a red car", "2,6", 2098),
	            ("A horse and a dog", "2,5", 123),
	            ("A painting of an elephant with glasses", "5,7", 123),
	            ("A playful kitten chasing a butterfly in a wildflower meadow", "3,6,10", 123),
	            ("A grizzly bear catching a salmon in a crystal clear river surrounded by a forest", "2,6,15", 123),
	            ("A pod of dolphins leaping out of the water in an ocean with a ship on the background", "4,16", 123),
	        ]
	        examples = [
	            [example_prompt, example_indices, example_seed, use_attend_and_excite]
	            for example_prompt, example_indices, example_seed in _example_cases
	            for use_attend_and_excite in (True, False)
	        ]
	        gr.Examples(
	            examples=examples,
	            inputs=[prompt, token_indices_str, seed, apply_attend_and_excite],
	            outputs=[token_indices_table, result],
	            fn=process_example,
	            cache_examples=os.getenv("CACHE_EXAMPLES") == "1",
	            examples_per_page=20,
	        )

	    # Standalone lookup: fill the token table for the current prompt.
	    show_token_indices_button.click(
	        fn=get_token_table,
	        inputs=prompt,
	        outputs=token_indices_table,
	        queue=False,
	        api_name="get-token-table",
	    )

	    # Generation chain, started by submitting either text box or clicking
	    # "Generate": update the seed, refresh the token table, then run.
	    gr.on(
	        triggers=[prompt.submit, token_indices_str.submit, run_button.click],
	        fn=randomize_seed_fn,
	        inputs=[seed, randomize_seed],
	        outputs=seed,
	        queue=False,
	        api_name=False,
	    ).then(
	        fn=get_token_table,
	        inputs=prompt,
	        outputs=token_indices_table,
	        queue=False,
	        api_name=False,
	    ).then(
	        fn=run,
	        inputs=[
	            prompt,
	            token_indices_str,
	            seed,
	            apply_attend_and_excite,
	            num_inference_steps,
	            guidance_scale,
	        ],
	        outputs=result,
	        api_name="run",
	    )

	# Script entry point: enable the request queue (at most 20 pending
	# requests) and start the app.
	if __name__ == "__main__":
	    queued_demo = demo.queue(max_size=20)
	    queued_demo.launch()