import gradio as gr
import asyncio
from threading import RLock
from pathlib import Path
from huggingface_hub import InferenceClient
import os
import re


HF_TOKEN = os.environ.get("HF_TOKEN") or None # If private or gated models aren't used, ENV setting is unnecessary.
server_timeout = 600
inference_timeout = 300


lock = RLock()
loaded_models = {}  # model name -> loaded client (gr.Interface or InferenceClient)
model_info_dict = {}  # model name -> dict built by get_t2i_model_info_dict()


def to_list(s):
    """Split a comma-separated string into a list of stripped items."""
    return [x.strip() for x in s.split(",")]


def list_sub(a, b):
    """Return the items of `a` that are not in `b`, keeping their order."""
    return [e for e in a if e not in b]


def list_uniq(l):
    """Return `l` without duplicates, keeping the first occurrence of each item."""
    # dict preserves insertion order, so this is the linear-time equivalent of
    # sorted(set(l), key=l.index).
    return list(dict.fromkeys(l))


def is_repo_name(s):
    """Return a match object if `s` looks like `owner/name`, otherwise None."""
    return re.fullmatch(r'^[^/]+?/[^/]+?$', s)


def get_status(model_name: str):
    """Query the Inference API status of `model_name` with a 10 second timeout."""
    client = InferenceClient(token=HF_TOKEN, timeout=10)
    return client.get_model_status(model_name)


def is_loadable(model_name: str, force_gpu: bool = False):
    """Return True if the model state is "Loadable" or "Loaded".

    With `force_gpu`, the reported compute type must also contain a "gpu" key.
    Any error while fetching the status is printed and reported as False.
    """
    try:
        status = get_status(model_name)
    except Exception as e:
        print(e)
        print(f"Couldn't load {model_name}.")
        return False
    # Check for a missing status before touching its attributes.
    if status is None:
        print(f"Couldn't load {model_name}.")
        return False
    gpu_state = isinstance(status.compute_type, dict) and "gpu" in status.compute_type.keys()
    loadable = status.state in ["Loadable", "Loaded"] and (not force_gpu or gpu_state)
    if not loadable:
        print(f"Couldn't load {model_name}. Model state:'{status.state}', GPU:{gpu_state}")
    return loadable


def find_model_list(author: str="", tags: list[str]=[], not_tag="", sort: str="last_modified", limit: int=30, force_gpu=False, check_status=False):
    """List ids of text-to-image diffusers models on the Hub.

    Args:
        author: Hub user or organization to search in.
        tags: Extra tags required in addition to "diffusers".
        not_tag: Models carrying this tag are skipped.
        sort: Sort key passed to `list_models`; falls back to "last_modified".
        limit: Maximum number of ids to return.
        force_gpu: Passed to `is_loadable` when `check_status` is set.
        check_status: If True, only keep models that `is_loadable` accepts.

    Returns:
        A list of model ids; empty when the listing request fails.
    """
    from huggingface_hub import HfApi
    api = HfApi(token=HF_TOKEN)
    default_tags = ["diffusers"]
    if not sort:
        sort = "last_modified"
    # Over-fetch because candidates are filtered below. This is kept separate
    # from `limit` so the early exit still compares against the caller's value.
    fetch_limit = limit * 20 if check_status and force_gpu else limit * 5
    models = []
    try:
        model_infos = api.list_models(author=author, task="text-to-image",
                                      tags=list_uniq(default_tags + tags), cardData=True, sort=sort, limit=fetch_limit)
    except Exception as e:
        print(f"Error: Failed to list models.")
        print(e)
        return models
    for model in model_infos:
        # Private or gated models are only usable when a token is configured.
        if (model.private or model.gated) and HF_TOKEN is None:
            continue
        if not_tag and not_tag in model.tags:
            continue
        # The status check is a network call, so run it after the cheap filters.
        if check_status and not is_loadable(model.id, force_gpu):
            continue
        models.append(model.id)
        if limit > 0 and len(models) >= limit:
            break
    return models


def get_t2i_model_info_dict(repo_id: str):
    """Collect display information about a diffusers model repository.

    Returns:
        A dict that always has an "md" key. It is just `{"md": "None"}` when
        the repo id is malformed, missing, filtered out or not tagged
        "diffusers". Otherwise it also holds "ver", "url", "tags",
        "downloads", "likes" and "last_modified".
    """
    from huggingface_hub import HfApi
    api = HfApi(token=HF_TOKEN)
    info = {"md": "None"}
    try:
        if not is_repo_name(repo_id) or not api.repo_exists(repo_id=repo_id):
            return info
        model = api.model_info(repo_id=repo_id, token=HF_TOKEN)
    except Exception as e:
        print(f"Error: Failed to get {repo_id}'s info.")
        print(e)
        return info
    # NOTE(review): this parses as `private or (gated and no token)`, so private
    # models are always filtered out here, while find_model_list() accepts them
    # whenever a token is set. Confirm which behavior is intended.
    if model.private or model.gated and HF_TOKEN is None:
        return info
    try:
        tags = model.tags or []
    except Exception as e:
        print(e)
        return info
    if 'diffusers' not in tags:
        return info
    # The first matching pipeline tag decides the version label.
    pipeline_versions = (
        ('diffusers:FluxPipeline', "FLUX.1"),
        ('diffusers:StableDiffusionXLPipeline', "SDXL"),
        ('diffusers:StableDiffusionPipeline', "SD1.5"),
        ('diffusers:StableDiffusion3Pipeline', "SD3"),
    )
    info["ver"] = next((ver for tag, ver in pipeline_versions if tag in tags), "Other")
    info["url"] = f"https://huggingface.co/{repo_id}/"
    info["tags"] = model.card_data.tags if model.card_data and model.card_data.tags else []
    info["downloads"] = model.downloads
    info["likes"] = model.likes
    info["last_modified"] = model.last_modified.strftime("lastmod: %Y-%m-%d")
    un_tags = ['text-to-image', 'stable-diffusion', 'stable-diffusion-api', 'safetensors', 'stable-diffusion-xl']
    descs = [info["ver"]] + list_sub(info["tags"], un_tags) + [f'DLs: {info["downloads"]}'] + [f'❤: {info["likes"]}'] + [info["last_modified"]]
    info["md"] = f'Model Info: {", ".join(descs)} [Model Repo]({info["url"]})'
    return info


def rename_image(image_path: str | None, model_name: str, save_path: str | None = None):
    """Re-save an image as RGBA PNG and move it to its final path.

    The target is `save_path` when given, otherwise
    `<model short name>_<YYYYmmdd_HHMMSS>.png` (timestamp in UTC+9) resolved
    against the current directory.

    Returns:
        The new path as a string, or None when `image_path` is None, does not
        exist, or any step raises.
    """
    from PIL import Image, ImageFile
    ImageFile.LOAD_TRUNCATED_IMAGES = True
    from datetime import datetime, timezone, timedelta
    if image_path is None:
        return None
    dt_now = datetime.now(timezone(timedelta(hours=9)))
    filename = f"{model_name.split('/')[-1]}_{dt_now.strftime('%Y%m%d_%H%M%S')}.png"
    try:
        if not Path(image_path).exists():
            return None
        png_path = "image.png"
        # Close the source file before writing: `image_path` may be the same
        # file as `png_path`.
        with Image.open(image_path) as src:
            rgba = src.convert('RGBA')
        rgba.save(png_path, "PNG")
        target = Path(save_path) if save_path is not None else Path(filename)
        return str(Path(png_path).resolve().rename(target.resolve()))
    except Exception as e:
        print(e)
        return None


def save_gallery(image_path: str | None, images: list[tuple] | None):
    """Prepend `image_path` to a gallery list and to its list of file paths.

    `images` is modified in place when it is not None.

    Returns:
        A tuple `(images, files)`. Both are unchanged when `image_path` is None.
    """
    if images is None:
        images = []
    files = [i[0] for i in images]
    if image_path is None:
        return images, files
    files.insert(0, str(image_path))
    images.insert(0, (str(image_path), Path(image_path).stem))
    return images, files


# https://github.com/gradio-app/gradio/blob/main/gradio/external.py
# https://huggingface.co/docs/huggingface_hub/package_reference/inference_client
from typing import Literal
def load_from_model(model_name: str, hf_token: str | Literal[False] | None = None):
    """Build a `gr.Interface` that calls `text_to_image` for `model_name`.

    Raises:
        ModelNotFoundError: If the Inference API does not answer with HTTP 200
            or the model's pipeline tag is not "text-to-image".
    """
    import httpx
    import huggingface_hub
    from gradio.exceptions import ModelNotFoundError, TooManyRequestsError
    model_url = f"https://huggingface.co/{model_name}"
    api_url = f"https://api-inference.huggingface.co/models/{model_name}"
    print(f"Fetching model from: {model_url}")

    headers = ({} if hf_token in [False, None] else {"Authorization": f"Bearer {hf_token}"})
    response = httpx.request("GET", api_url, headers=headers)
    if response.status_code != 200:
        raise ModelNotFoundError(
            f"Could not find model: {model_name}. If it is a private or gated model, please provide your Hugging Face access token (https://huggingface.co/settings/tokens) as the argument for the `hf_token` parameter."
        )
    p = response.json().get("pipeline_tag")
    if p != "text-to-image":
        raise ModelNotFoundError(f"This model isn't for text-to-image or unsupported: {model_name}.")

    headers["X-Wait-For-Model"] = "true"
    client = huggingface_hub.InferenceClient(model=model_name, headers=headers,
                                             token=hf_token, timeout=server_timeout)
    inputs = gr.components.Textbox(label="Input")
    outputs = gr.components.Image(label="Output")
    fn = client.text_to_image

    def query_huggingface_inference_endpoints(*data, **kwargs):
        try:
            data = fn(*data, **kwargs) # type: ignore
        except huggingface_hub.utils.HfHubHTTPError as e:
            if "429" in str(e):
                raise TooManyRequestsError() from e
            # Other Hub HTTP errors fall through and return the positional
            # argument tuple; infer_body() treats a tuple result as a failure.
        except Exception as e:
            raise Exception(e) from e
        return data

    interface_info = {
        "fn": query_huggingface_inference_endpoints,
        "inputs": inputs,
        "outputs": outputs,
        "title": model_name,
    }
    return gr.Interface(**interface_info)


def load_model(model_name: str):
    """Return the cached client for `model_name`, loading it via `load_from_model` if needed.

    Returns:
        The loaded object, or None when loading fails. Failure to collect the
        model info is printed but does not invalidate the loaded model.
    """
    if model_name in loaded_models:
        return loaded_models[model_name]
    try:
        loaded_models[model_name] = load_from_model(model_name, hf_token=HF_TOKEN)
        print(f"Loaded: {model_name}")
    except Exception as e:
        loaded_models.pop(model_name, None)
        print(f"Failed to load: {model_name}")
        print(e)
        return None
    try:
        model_info_dict[model_name] = get_t2i_model_info_dict(model_name)
        print(f"Assigned: {model_name}")
    except Exception as e:
        model_info_dict.pop(model_name, None)
        print(f"Failed to assigned: {model_name}")
        print(e)
    return loaded_models[model_name]


def load_model_api(model_name: str):
    """Return the cached client for `model_name`, creating an `InferenceClient` if needed.

    A client is only created when the model status reports the "diffusers"
    framework and a state of "Loadable" or "Loaded".

    Returns:
        The cached or new client, or None when the status check fails.
    """
    if model_name in loaded_models:
        return loaded_models[model_name]
    try:
        # The token goes to the client constructor, as in get_status();
        # get_model_status() is called with the model name only.
        client = InferenceClient(token=HF_TOKEN, timeout=5)
        status = client.get_model_status(model_name)
        if status is None or status.framework != "diffusers" or status.state not in ["Loadable", "Loaded"]:
            print(f"Failed to load by API: {model_name}")
            return None
        loaded_models[model_name] = InferenceClient(model_name, token=HF_TOKEN, timeout=server_timeout)
        print(f"Loaded by API: {model_name}")
    except Exception as e:
        loaded_models.pop(model_name, None)
        print(f"Failed to load by API: {model_name}")
        print(e)
        return None
    try:
        model_info_dict[model_name] = get_t2i_model_info_dict(model_name)
        print(f"Assigned by API: {model_name}")
    except Exception as e:
        model_info_dict.pop(model_name, None)
        print(f"Failed to assigned by API: {model_name}")
        print(e)
    return loaded_models[model_name]


def load_models(models: list):
    """Call `load_model` for every name in `models`."""
    for model in models:
        load_model(model)


positive_prefix = {
    "Pony": to_list("score_9, score_8_up, score_7_up"),
    "Pony Anime": to_list("source_anime, anime, score_9, score_8_up, score_7_up"),
}
positive_suffix = {
    "Common": to_list("highly detailed, masterpiece, best quality, very aesthetic, absurdres"),
    "Anime": to_list("anime artwork, anime style, studio anime, highly detailed"),
}
negative_prefix = {
    "Pony": to_list("score_6, score_5, score_4"),
    "Pony Anime": to_list("score_6, score_5, score_4, source_pony, source_furry, source_cartoon"),
    "Pony Real": to_list("score_6, score_5, score_4, source_anime, source_pony, source_furry, source_cartoon"),
}
negative_suffix = {
    "Common": to_list("lowres, (bad), bad hands, bad feet, text, error, fewer, extra, missing, worst quality, jpeg artifacts, low quality, watermark, unfinished, displeasing, oldest, early, chromatic aberration, signature, extra digits, artistic error, username, scan, [abstract]"),
    "Pony Anime": to_list("busty, ugly face, mutated hands, low res, blurry face, black and white, the simpsons, overwatch, apex legends"),
    "Pony Real": to_list("ugly, airbrushed, simple background, cgi, cartoon, anime"),
}


def _collect_preset_tags(*presets):
    """Return every tag of the given preset dicts, plus its underscore-free variant."""
    collected = []
    # Walk the values of each dict separately. Merging the dicts first would
    # drop entries whose key appears in both, e.g. "Pony Anime".
    for preset in presets:
        for words in preset.values():
            collected.extend(words)
            collected.extend(w.replace("_", " ") for w in words)
    return list_uniq(collected)


positive_all = _collect_preset_tags(positive_prefix, positive_suffix)
negative_all = _collect_preset_tags(negative_prefix, negative_suffix)


def recom_prompt(prompt: str = "", neg_prompt: str = "", pos_pre: list = [], pos_suf: list = [], neg_pre: list = [], neg_suf: list = []):
    """Strip known preset tags from both prompts and re-apply the selected presets.

    Args:
        prompt: Comma-separated positive prompt; None is treated as "".
        neg_prompt: Comma-separated negative prompt; None is treated as "".
        pos_pre, pos_suf: Keys of `positive_prefix` / `positive_suffix`.
        neg_pre, neg_suf: Keys of `negative_prefix` / `negative_suffix`.

    Returns:
        A tuple `(prompt, neg_prompt)` of comma-joined strings.
    """
    def flatten(src):
        return [item for row in src for item in row]
    prompts = list_sub(to_list(prompt or ""), positive_all)
    neg_prompts = list_sub(to_list(neg_prompt or ""), negative_all)
    # When nothing of the user's text remains, append an empty item.
    last_empty_p = [""] if not prompts else []
    last_empty_np = [""] if not neg_prompts else []
    prefix_ps = flatten([positive_prefix.get(s, []) for s in pos_pre])
    suffix_ps = flatten([positive_suffix.get(s, []) for s in pos_suf])
    prefix_nps = flatten([negative_prefix.get(s, []) for s in neg_pre])
    suffix_nps = flatten([negative_suffix.get(s, []) for s in neg_suf])
    prompt = ", ".join(list_uniq(prefix_ps + prompts + suffix_ps) + last_empty_p)
    neg_prompt = ", ".join(list_uniq(prefix_nps + neg_prompts + suffix_nps) + last_empty_np)
    return prompt, neg_prompt


# Preset name -> (positive prefix keys, positive suffix keys,
#                 negative prefix keys, negative suffix keys)
recom_prompt_type = {
    "None": ([], [], [], []),
    "Auto": ([], [], [], []),
    "Common": ([], ["Common"], [], ["Common"]),
    "Animagine": ([], ["Common", "Anime"], [], ["Common"]),
    "Pony": (["Pony"], ["Common"], ["Pony"], ["Common"]),
    "Pony Anime": (["Pony", "Pony Anime"], ["Common", "Anime"], ["Pony", "Pony Anime"], ["Common", "Pony Anime"]),
    "Pony Real": (["Pony"], ["Common"], ["Pony", "Pony Real"], ["Common", "Pony Real"]),
}


enable_auto_recom_prompt = False
def insert_recom_prompt(prompt: str = "", neg_prompt: str = "", type: str = "None"):
    """Apply the preset named `type` to both prompts via `recom_prompt`.

    Also sets the module flag `enable_auto_recom_prompt` to whether `type`
    is "Auto". Unknown preset names behave like "None".
    """
    global enable_auto_recom_prompt
    enable_auto_recom_prompt = type == "Auto"
    pos_pre, pos_suf, neg_pre, neg_suf = recom_prompt_type.get(type, ([], [], [], []))
    return recom_prompt(prompt, neg_prompt, pos_pre, pos_suf, neg_pre, neg_suf)


def set_recom_prompt_preset(type: str = "None"):
    """Return the four key lists of preset `type`, or four empty lists if unknown."""
    pos_pre, pos_suf, neg_pre, neg_suf = recom_prompt_type.get(type, ([], [], [], []))
    return pos_pre, pos_suf, neg_pre, neg_suf


def get_recom_prompt_type():
    """Return the preset names except "Auto"."""
    names = list(recom_prompt_type.keys())
    names.remove("Auto")
    return names


def get_positive_prefix():
    """Return the keys of `positive_prefix`."""
    return list(positive_prefix.keys())


def get_positive_suffix():
    """Return the keys of `positive_suffix`."""
    return list(positive_suffix.keys())


def get_negative_prefix():
    """Return the keys of `negative_prefix`."""
    return list(negative_prefix.keys())


def get_negative_suffix():
    """Return the keys of `negative_suffix`."""
    return list(negative_suffix.keys())


def get_tag_type(pos_pre: list = [], pos_suf: list = [], neg_pre: list = [], neg_suf: list = []):
    """Return "e621" if any selected preset key contains "Pony", else "danbooru"."""
    words = pos_pre + pos_suf + neg_pre + neg_suf
    return "e621" if any("Pony" in word for word in words) else "danbooru"


def get_model_info_md(model_name: str):
    """Return the "md" text recorded for `model_name`, or None if nothing is recorded."""
    info = model_info_dict.get(model_name)
    if info is None:
        return None
    return info.get("md", "")


def change_model(model_name: str):
    """Load `model_name` through `load_model_api` and return its info text."""
    load_model_api(model_name)
    return get_model_info_md(model_name)


def warm_model(model_name: str):
    """Load `model_name` and run one inference with a blank prompt; errors are only printed."""
    model = load_model_api(model_name)
    if model:
        try:
            print(f"Warming model: {model_name}")
            infer_body(model, " ")
        except Exception as e:
            print(e)


# https://huggingface.co/docs/api-inference/detailed_parameters
# https://huggingface.co/docs/huggingface_hub/package_reference/inference_client
def infer_body(client: InferenceClient | gr.Interface | object, prompt: str, neg_prompt: str | None = None,
               height: int | None = None, width: int | None = None,
               steps: int | None = None, cfg: int | None = None, seed: int = -1):
    """Run one text-to-image request and save the result to `image.png`.

    Optional parameters are only forwarded when they pass the checks below
    (height/width >= 256, steps >= 1, cfg > 0, seed >= 0).

    Returns:
        The absolute path of the saved image as a string, or None when
        `client` is of an unsupported type or the call returned a tuple.

    Raises:
        Exception: Wrapping any error raised during the request or the save.
    """
    # NOTE(review): every call writes to the same relative path; concurrent
    # calls would overwrite each other's file.
    png_path = "image.png"
    kwargs = {}
    if height is not None and height >= 256:
        kwargs["height"] = height
    if width is not None and width >= 256:
        kwargs["width"] = width
    if steps is not None and steps >= 1:
        kwargs["num_inference_steps"] = steps
    if cfg is not None and cfg > 0:
        kwargs["guidance_scale"] = cfg
    if seed >= 0:
        kwargs["seed"] = seed
    try:
        # NOTE(review): `token` is forwarded as an extra keyword argument;
        # confirm the installed text_to_image() accepts it.
        if isinstance(client, InferenceClient):
            image = client.text_to_image(prompt=prompt, negative_prompt=neg_prompt, **kwargs, token=HF_TOKEN)
        elif isinstance(client, gr.Interface):
            image = client.fn(prompt=prompt, negative_prompt=neg_prompt, **kwargs, token=HF_TOKEN)
        else:
            return None
        # The wrapper built by load_from_model() returns its positional
        # argument tuple when a Hub HTTP error was swallowed.
        if isinstance(image, tuple):
            return None
        image.save(png_path)
        return str(Path(png_path).resolve())
    except Exception as e:
        print(e)
        raise Exception(e) from e


async def infer(model_name: str, prompt: str, neg_prompt: str | None = None,
                height: int | None = None, width: int | None = None,
                steps: int | None = None, cfg: int | None = None, seed: int = -1,
                save_path: str | None = None, timeout: float = inference_timeout):
    """Run `infer_body` in a worker thread with a timeout and rename the result.

    When `seed` is negative, 1 to 500 spaces are appended to the prompt.

    Returns:
        The path returned by `rename_image`, or None when the model cannot be
        loaded or no image was produced.

    Raises:
        Exception: On timeout ("Task timed out: ...") or wrapping any other error.
    """
    import random
    noise = " " * random.randint(1, 500) if seed < 0 else ""
    model = load_model(model_name)
    if not model:
        return None
    task = asyncio.create_task(asyncio.to_thread(infer_body, model, f"{prompt} {noise}", neg_prompt,
                                                 height, width, steps, cfg, seed))
    await asyncio.sleep(0)
    try:
        result = await asyncio.wait_for(task, timeout=timeout)
    except asyncio.TimeoutError as e:
        print(e)
        print(f"Task timed out: {model_name}")
        if not task.done():
            task.cancel()
        raise Exception(f"Task timed out: {model_name}") from e
    except Exception as e:
        print(e)
        if not task.done():
            task.cancel()
        raise Exception(e) from e
    if result is None:
        return None
    # rename_image() goes through the shared "image.png" file, so serialize it.
    with lock:
        return rename_image(result, model_name, save_path)


# https://github.com/aio-libs/pytest-aiohttp/issues/8
# also AsyncInferenceClient is buggy.
def _run_inference(model_name, prompt, neg_prompt, height, width, steps, cfg, seed,
                   pos_pre, pos_suf, neg_pre, neg_suf, save_path):
    """Apply the prompt presets and run `infer` to completion on a private event loop."""
    # Always use a fresh loop owned by this call. A loop obtained from
    # get_running_loop() can neither be driven with run_until_complete() nor
    # closed here, and closing it in `finally` would mask the real error.
    loop = asyncio.new_event_loop()
    try:
        # recom_prompt() splits both prompts, so map None to "".
        prompt, neg_prompt = recom_prompt(prompt or "", neg_prompt or "", pos_pre, pos_suf, neg_pre, neg_suf)
        return loop.run_until_complete(infer(model_name, prompt, neg_prompt, height, width,
                                             steps, cfg, seed, save_path, inference_timeout))
    except (Exception, asyncio.CancelledError) as e:
        print(e)
        print(f"Task aborted: {model_name}, Error: {e}")
        raise gr.Error(f"Task aborted: {model_name}, Error: {e}") from e
    finally:
        loop.close()


def infer_fn(model_name: str, prompt: str, neg_prompt: str | None = None, height: int | None = None,
             width: int | None = None, steps: int | None = None, cfg: int | None = None, seed: int = -1,
             pos_pre: list = [], pos_suf: list = [], neg_pre: list = [], neg_suf: list = [], save_path: str | None = None):
    """Generate one image with `model_name`, blocking until it is done.

    The prompts are first passed through `recom_prompt` with the given preset
    keys.

    Returns:
        The value returned by `infer`, or None when `model_name` is 'NA'.

    Raises:
        gr.Error: If prompt processing or inference fails or is cancelled.
    """
    if model_name == 'NA':
        return None
    return _run_inference(model_name, prompt, neg_prompt, height, width, steps, cfg, seed,
                          pos_pre, pos_suf, neg_pre, neg_suf, save_path)


def infer_rand_fn(model_name_dummy: str, prompt: str, neg_prompt: str | None = None, height: int | None = None,
                  width: int | None = None, steps: int | None = None, cfg: int | None = None, seed: int = -1,
                  pos_pre: list = [], pos_suf: list = [], neg_pre: list = [], neg_suf: list = [], save_path: str | None = None):
    """Generate one image with a model picked at random from `loaded_models`.

    `model_name_dummy` is only compared against 'NA'; any other value is
    ignored.

    Returns:
        The value returned by `infer`, or None when `model_name_dummy` is 'NA'.

    Raises:
        gr.Error: If no model is loaded, or if prompt processing or inference
            fails or is cancelled.
    """
    import random
    if model_name_dummy == 'NA':
        return None
    random.seed()
    # random.choice() raises a bare IndexError on an empty list; report it clearly.
    if not loaded_models:
        raise gr.Error("Task aborted: no models are loaded.")
    model_name = random.choice(list(loaded_models.keys()))
    return _run_inference(model_name, prompt, neg_prompt, height, width, steps, cfg, seed,
                          pos_pre, pos_suf, neg_pre, neg_suf, save_path)