from modules.utils import *


class Image2Line:
    """Tool that runs an MLSD line detector over an image file and saves the result."""

    def __init__(self, device, pretrained_model_dir):
        """Load the MLSD detector.

        Args:
            device: Not used by this class; the constructor takes it so that its
                signature matches ``LineText2Image``.
            pretrained_model_dir: Directory that contains a ``ControlNet``
                sub-directory from which the detector is loaded.
        """
        print("Initializing Image2Line")
        self.detector = MLSDdetector.from_pretrained(f'{pretrained_model_dir}/ControlNet')

    # NOTE: the description below is runtime text handed to ``prompts``; its
    # wording (including spelling) is intentionally left untouched.
    @prompts(name="Line Detection On Image",
             description="useful when you want to detect the straight line of the image. "
                         "like: detect the straight lines of this image, or straight line detection on image, "
                         "or peform straight line detection on this image, or detect the straight line image of this image. "
                         "The input to this tool should be a string, representing the image_path")
    def inference(self, inputs):
        """Detect straight lines in the image at ``inputs`` and save the line image.

        Args:
            inputs: Path of the image to process.

        Returns:
            The path the detector output was saved to, as produced by
            ``get_new_image_name(inputs, func_name="line-of")``.
        """
        # Context manager releases the underlying file handle as soon as the
        # detector has consumed the image.
        with Image.open(inputs) as image:
            mlsd = self.detector(image)
        updated_image_path = get_new_image_name(inputs, func_name="line-of")
        mlsd.save(updated_image_path)
        print(f"\nProcessed Image2Line, Input Image: {inputs}, Output Line: {updated_image_path}")
        return updated_image_path


class LineText2Image:
    """Tool that generates an image from a line image plus a text description.

    Uses a Stable Diffusion ControlNet pipeline with the ``sd-controlnet-mlsd``
    ControlNet weights.
    """

    def __init__(self, device, pretrained_model_dir):
        """Build the ControlNet pipeline and move it to ``device``.

        Args:
            device: Device string; float16 weights are used when it contains
                ``'cuda'``, float32 otherwise.
            pretrained_model_dir: Directory that contains the
                ``sd-controlnet-mlsd`` and ``stable-diffusion-v1-5``
                sub-directories.
        """
        print(f"Initializing LineText2Image to {device}")
        self.torch_dtype = torch.float16 if 'cuda' in device else torch.float32
        self.controlnet = ControlNetModel.from_pretrained(
            f"{pretrained_model_dir}/sd-controlnet-mlsd",
            torch_dtype=self.torch_dtype,
        )
        self.pipe = StableDiffusionControlNetPipeline.from_pretrained(
            f"{pretrained_model_dir}/stable-diffusion-v1-5",
            controlnet=self.controlnet,
            safety_checker=None,
            torch_dtype=self.torch_dtype,
        )
        self.pipe.scheduler = UniPCMultistepScheduler.from_config(self.pipe.scheduler.config)
        self.pipe.to(device)
        # Placeholder until the first call to ``inference`` draws a real seed.
        self.seed = -1
        # Appended to every user prompt.
        self.a_prompt = 'best quality, extremely detailed'
        # Negative prompt passed to the pipeline on every call.
        self.n_prompt = 'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, ' \
                        'fewer digits, cropped, worst quality, low quality'

    # NOTE: the description below is runtime text handed to ``prompts``; its
    # wording (including spelling) is intentionally left untouched.
    @prompts(name="Generate Image Condition On Line Image",
             description="useful when you want to generate a new real image from both the user desciption "
                         "and a straight line image. "
                         "like: generate a real image of a object or something from this straight line image, "
                         "or generate a new real image of a object or something from this straight lines. "
                         "The input to this tool should be a comma seperated string of two, "
                         "representing the image_path and the user description. ")
    def inference(self, inputs):
        """Generate an image conditioned on a line image and a text description.

        Args:
            inputs: ``"<image_path>,<description>"``. Everything before the
                first comma is the image path; everything after it (further
                commas included) is the description. Without a comma the
                description is empty.

        Returns:
            The path the generated image was saved to, as produced by
            ``get_new_image_name(image_path, func_name="line2image")``.
        """
        # Split once on the first comma only, so commas inside the
        # description are preserved.
        image_path, _, instruct_text = inputs.partition(",")
        with Image.open(image_path) as line_image:
            # A fresh seed is drawn per call and kept on the instance.
            self.seed = random.randint(0, 65535)
            seed_everything(self.seed)
            prompt = f"{instruct_text}, {self.a_prompt}"
            generated = self.pipe(
                prompt,
                line_image,
                num_inference_steps=20,
                eta=0.0,
                negative_prompt=self.n_prompt,
                guidance_scale=9.0,
            ).images[0]
        updated_image_path = get_new_image_name(image_path, func_name="line2image")
        generated.save(updated_image_path)
        # The output is an image file, so label it as such in the log.
        print(f"\nProcessed LineText2Image, Input Line: {image_path}, Input Text: {instruct_text}, "
              f"Output Image: {updated_image_path}")
        return updated_image_path