"""Gradio app that generates Live2D-style reference sheets with a FLUX pipeline.

The script downloads a FLUX checkpoint, fuses the configured LoRA weights into
it, and exposes a small web UI. A preset prompt required by the LoRA is always
prepended to the user's description.
"""

import argparse
import os
import time
from os import path

# The Hugging Face cache variables are read when `huggingface_hub` (and the
# libraries built on it) are imported, so they must be set *before* those
# imports; setting them afterwards has no effect on where models are stored.
cache_path = path.join(path.dirname(path.abspath(__file__)), "models")
os.environ["TRANSFORMERS_CACHE"] = cache_path
os.environ["HF_HUB_CACHE"] = cache_path
os.environ["HF_HOME"] = cache_path
os.makedirs(cache_path, exist_ok=True)

# Third-party imports deliberately follow the environment setup above.
from safetensors.torch import load_file
import huggingface_hub
from huggingface_hub import hf_hub_download

import spaces
import gradio as gr
import torch
from diffusers import FluxPipeline

torch.backends.cuda.matmul.allow_tf32 = True

# Text shown at the top of the page (kept at column 0 so Markdown does not
# treat it as an indented code block).
HEADER_MARKDOWN = """

Live2D Base Model Maker

The LoRA's *required* prompt is preloaded

"""


class timer:
    """Context manager that prints how long the wrapped block took."""

    def __init__(self, method_name="timed process"):
        self.method = method_name

    def __enter__(self):
        # perf_counter is monotonic, so the measured duration cannot go
        # negative if the wall clock is adjusted mid-run.
        self.start = time.perf_counter()
        print(f"{self.method} starts")

    def __exit__(self, exc_type, exc_val, exc_tb):
        elapsed = time.perf_counter() - self.start
        print(f"{self.method} took {round(elapsed, 2)}s")


def load_and_fuse_lora_weights(pipe, lora_models):
    """Download each LoRA and fuse it into *pipe*.

    Args:
        pipe: Pipeline exposing ``load_lora_weights`` and ``fuse_lora``.
        lora_models: Iterable of ``(repo_id, filename, lora_scale)`` tuples.
    """
    for repo, file_path, lora_scale in lora_models:
        lora_weights_path = hf_hub_download(repo_id=repo, filename=file_path)
        pipe.load_lora_weights(lora_weights_path)
        pipe.fuse_lora(lora_scale=lora_scale)


def _make_generator(seed):
    """Return a ``torch.Generator`` for *seed*.

    A missing (``None``) or negative seed means "pick one at random"; the
    chosen value is printed so a run can still be reproduced afterwards.
    """
    generator = torch.Generator()
    if seed is None or int(seed) < 0:
        chosen = generator.seed()
        print(f"no seed given; using random seed {chosen}")
    else:
        generator.manual_seed(int(seed))
    return generator


# List of LoRA models and their corresponding scales
lora_models = [
    ("mrcuddle/live2d-model-maker", "LIVE2D-FLUX.safetensors", 0.125),
]

pipe = FluxPipeline.from_pretrained(
    "alfredplpl/flux.1-dev-modern-anime-full",
    torch_dtype=torch.bfloat16,
)

# Load and fuse LoRA weights
load_and_fuse_lora_weights(pipe, lora_models)

pipe.to(device="cuda", dtype=torch.bfloat16)


@spaces.GPU
def process_image(height, width, steps, scales, prompt, seed, preset_prompt):
    """Generate one image from the preset prompt plus the user's description.

    Args:
        height: Output height in pixels.
        width: Output width in pixels.
        steps: Number of inference steps.
        scales: Guidance scale.
        prompt: User-supplied image description.
        seed: Seed for the random generator; ``None`` or a negative value
            selects a random seed.
        preset_prompt: Prompt text required by the LoRA, placed first.

    Returns:
        The first image produced by the pipeline.
    """
    with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
        # Concatenate the preset prompt with the user's input prompt
        full_prompt = f"{preset_prompt} {prompt}"
        return pipe(
            prompt=[full_prompt],
            generator=_make_generator(seed),
            num_inference_steps=int(steps),
            guidance_scale=float(scales),
            height=int(height),
            width=int(width),
            max_sequence_length=256,
        ).images[0]


# NOTE(review): the widget nesting below is reconstructed from the order of
# the `with` statements; confirm it matches the intended layout.
with gr.Blocks(theme=gr.themes.Soft()) as demo:
    gr.Markdown(HEADER_MARKDOWN)

    with gr.Row():
        with gr.Column(scale=3):
            with gr.Group():
                prompt = gr.Textbox(
                    label="Your Image Description",
                    placeholder="Girl with Red Dragon Wings",
                    lines=3,
                )

                # Hidden textbox for the preset prompt
                preset_prompt = gr.Textbox(
                    label="Preset Prompt",
                    value="live2d,guijiaoxiansheng,separate hand,separate feet,separate head,multiple views,white background,magic particles, multiple references,color pallete reference,simple background,upper body,front,from side",
                    visible=False,
                )

                with gr.Accordion("Advanced Settings", open=False):
                    with gr.Group():
                        with gr.Row():
                            height = gr.Slider(label="Height", minimum=256, maximum=1152, step=64, value=1024)
                            width = gr.Slider(label="Width", minimum=256, maximum=1152, step=64, value=1024)

                        with gr.Row():
                            steps = gr.Slider(label="Inference Steps", minimum=5, maximum=25, step=1, value=8)
                            # step=0.1 keeps the 3.5 default on the slider's
                            # grid and allows fractional guidance values.
                            scales = gr.Slider(label="Guidance Scale", minimum=0.0, maximum=10.0, step=0.1, value=3.5)

                        seed = gr.Number(label="Seed (for reproducibility)", value=-1, precision=0)

            generate_btn = gr.Button("Generate Image", variant="primary", scale=1)

        with gr.Column(scale=4):
            output = gr.Image(label="Your Generated Image")

    # Event listeners must be registered inside the Blocks context.
    generate_btn.click(
        process_image,
        inputs=[height, width, steps, scales, prompt, seed, preset_prompt],
        outputs=output,
    )

if __name__ == "__main__":
    demo.launch()