Spaces:

VikramSingh178
/

picpilot-server

Paused

App Files Files Community

VikramSingh178 committed 15 days ago

Commit

40de55c

•

1 Parent(s): b427e12

chore: Add augment_image function to utils.py

Browse files

Files changed (4) hide show

api/routers/painting.py +31 -49
ui/__pycache__/ui.cpython-311.pyc +0 -0
ui/ui.py +66 -50
ui/utils.py +27 -0

api/routers/painting.py CHANGED Viewed

@@ -12,7 +12,7 @@ from hydra import compose, initialize
 from async_batcher.batcher import AsyncBatcher
 import json
 from functools import lru_cache
 pl.seed_everything(42)
 router = APIRouter()
@@ -31,6 +31,7 @@ def load_pipeline_wrapper():
     """
     pipeline = load_pipeline(cfg.model, accelerator(), enable_compile=True)
     return pipeline
 inpainting_pipeline = load_pipeline_wrapper()
 class InpaintingRequest(BaseModel):
@@ -44,8 +45,7 @@ class InpaintingRequest(BaseModel):
     guidance_scale: float = Field(..., description="Guidance scale for inference")
     mode: str = Field(..., description="Mode for output ('b64_json' or 's3_json')")
     num_images: int = Field(..., description="Number of images to generate")
-    use_augmentation: bool = Field(True, description="Whether to use image augmentation")
 class InpaintingBatchRequestModel(BaseModel):
     """
     Model representing a batch request for inpainting inference.
@@ -68,35 +68,14 @@ async def save_image(image: UploadFile) -> str:
         f.write(await image.read())
     return file_path
-def augment_image(image_path, target_width, target_height, roi_scale, segmentation_model_name, detection_model_name):
-    """
-    Augment an image by extending its dimensions and generating masks.
-    Args:
-        image_path (str): Path to the image file.
-        target_width (int): Target width for augmentation.
-        target_height (int): Target height for augmentation.
-        roi_scale (float): Scale factor for region of interest.
-        segmentation_model_name (str): Name of the segmentation model.
-        detection_model_name (str): Name of the detection model.
-    Returns:
-        Tuple[Image.Image, Image.Image]: Augmented image and inverted mask.
-    """
-    image = Image.open(image_path)
-    image_augmentation = ImageAugmentation(target_width, target_height, roi_scale)
-    image = image_augmentation.extend_image(image)
-    mask = image_augmentation.generate_mask_from_bbox(image, segmentation_model_name, detection_model_name)
-    inverted_mask = image_augmentation.invert_mask(mask)
-    return image, inverted_mask
-def run_inference(cfg, image_path: str, request: InpaintingRequest):
     """
     Run inference using an inpainting pipeline on an image.
     Args:
         cfg (dict): Configuration dictionary.
         image_path (str): Path to the image file.
         request (InpaintingRequest): Pydantic model containing inference parameters.
     Returns:
@@ -105,17 +84,8 @@ def run_inference(cfg, image_path: str, request: InpaintingRequest):
     Raises:
         ValueError: If an invalid mode is provided.
     """
-    if request.use_augmentation:
-        image, mask_image = augment_image(image_path,
-                                          cfg['target_width'],
-                                          cfg['target_height'],
-                                          cfg['roi_scale'],
-                                          cfg['segmentation_model'],
-                                          cfg['detection_model'])
-    else:
-        image = Image.open(image_path)
-        mask_image = None
     painting_pipeline = AutoPaintingPipeline(
         pipeline=inpainting_pipeline,
         image=image,
@@ -137,26 +107,33 @@ def run_inference(cfg, image_path: str, request: InpaintingRequest):
         raise ValueError("Invalid mode. Supported modes are 'b64_json' and 's3_json'.")
 class InpaintingBatcher(AsyncBatcher):
-    async def process_batch(self, batch: Tuple[List[str], List[InpaintingRequest]]) -> List[Dict[str, Any]]:
         """
         Process a batch of images and requests for inpainting inference.
         Args:
-            batch (Tuple[List[str], List[InpaintingRequest]]): Tuple of image paths and corresponding requests.
         Returns:
             List[Dict[str, Any]]: List of resulting images in the specified mode ('b64_json' or 's3_json').
         """
-        image_paths, requests = batch
         results = []
-        for image_path, request in zip(image_paths, requests):
-            result = run_inference(cfg, image_path, request)
-            results.append(result)
         return results
 @router.post("/inpainting")
 async def inpainting_inference(
     image: UploadFile = File(...),
     request_data: str = Form(...),
 ):
     """
@@ -164,6 +141,7 @@ async def inpainting_inference(
     Args:
         image (UploadFile): Uploaded image file.
         request_data (str): JSON string of the request parameters.
     Returns:
@@ -174,9 +152,10 @@ async def inpainting_inference(
     """
     try:
         image_path = await save_image(image)
         request_dict = json.loads(request_data)
         request = InpaintingRequest(**request_dict)
-        result = run_inference(cfg, image_path, request)
         return result
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
@@ -184,6 +163,7 @@ async def inpainting_inference(
 @router.post("/inpainting/batch")
 async def inpainting_batch_inference(
     images: List[UploadFile] = File(...),
     request_data: str = Form(...),
 ):
     """
@@ -191,6 +171,7 @@ async def inpainting_batch_inference(
     Args:
         images (List[UploadFile]): List of uploaded image files.
         request_data (str): JSON string of the request parameters.
     Returns:
@@ -204,13 +185,14 @@ async def inpainting_batch_inference(
         batch_request = InpaintingBatchRequestModel(**request_dict)
         requests = batch_request.requests
-        if len(images) != len(requests):
-            raise HTTPException(status_code=400, detail="The number of images and requests must match.")
         batcher = InpaintingBatcher(max_batch_size=64)
-        image_paths = [await save_image(image) for image in images]
-        results = batcher.process_batch((image_paths, requests))
         return results
     except Exception as e:
-        raise HTTPException(status_code=500, detail=str(e))

 from async_batcher.batcher import AsyncBatcher
 import json
 from functools import lru_cache
+import asyncio
 pl.seed_everything(42)
 router = APIRouter()
     """
     pipeline = load_pipeline(cfg.model, accelerator(), enable_compile=True)
     return pipeline
 inpainting_pipeline = load_pipeline_wrapper()
 class InpaintingRequest(BaseModel):
     guidance_scale: float = Field(..., description="Guidance scale for inference")
     mode: str = Field(..., description="Mode for output ('b64_json' or 's3_json')")
     num_images: int = Field(..., description="Number of images to generate")
 class InpaintingBatchRequestModel(BaseModel):
     """
     Model representing a batch request for inpainting inference.
         f.write(await image.read())
     return file_path
+def run_inference(cfg, image_path: str, mask_image_path: str, request: InpaintingRequest):
     """
     Run inference using an inpainting pipeline on an image.
     Args:
         cfg (dict): Configuration dictionary.
         image_path (str): Path to the image file.
+        mask_image_path (str): Path to the mask image file.
         request (InpaintingRequest): Pydantic model containing inference parameters.
     Returns:
     Raises:
         ValueError: If an invalid mode is provided.
     """
+    image = Image.open(image_path)
+    mask_image = Image.open(mask_image_path)
     painting_pipeline = AutoPaintingPipeline(
         pipeline=inpainting_pipeline,
         image=image,
         raise ValueError("Invalid mode. Supported modes are 'b64_json' and 's3_json'.")
 class InpaintingBatcher(AsyncBatcher):
+    def __init__(self, max_batch_size: int):
+        super().__init__(max_batch_size)
+    async def process_batch(self, batch: Tuple[List[str], List[str], List[InpaintingRequest]]) -> List[Dict[str, Any]]:
         """
         Process a batch of images and requests for inpainting inference.
         Args:
+            batch (Tuple[List[str], List[str], List[InpaintingRequest]]): Tuple of image paths, mask image paths, and corresponding requests.
         Returns:
             List[Dict[str, Any]]: List of resulting images in the specified mode ('b64_json' or 's3_json').
         """
+        image_paths, mask_image_paths, requests = batch
         results = []
+        for image_path, mask_image_path, request in zip(image_paths, mask_image_paths, requests):
+            try:
+                result = run_inference(cfg, image_path, mask_image_path, request)
+                results.append(result)
+            except Exception as e:
+                results.append({"error": str(e)})
         return results
 @router.post("/inpainting")
 async def inpainting_inference(
     image: UploadFile = File(...),
+    mask_image: UploadFile = File(...),
     request_data: str = Form(...),
 ):
     """
     Args:
         image (UploadFile): Uploaded image file.
+        mask_image (UploadFile): Uploaded mask image file.
         request_data (str): JSON string of the request parameters.
     Returns:
     """
     try:
         image_path = await save_image(image)
+        mask_image_path = await save_image(mask_image)
         request_dict = json.loads(request_data)
         request = InpaintingRequest(**request_dict)
+        result = run_inference(cfg, image_path, mask_image_path, request)
         return result
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 @router.post("/inpainting/batch")
 async def inpainting_batch_inference(
     images: List[UploadFile] = File(...),
+    mask_images: List[UploadFile] = File(...),
     request_data: str = Form(...),
 ):
     """
     Args:
         images (List[UploadFile]): List of uploaded image files.
+        mask_images (List[UploadFile]): List of uploaded mask image files.
         request_data (str): JSON string of the request parameters.
     Returns:
         batch_request = InpaintingBatchRequestModel(**request_dict)
         requests = batch_request.requests
+        if len(images) != len(requests) or len(images) != len(mask_images):
+            raise HTTPException(status_code=400, detail="The number of images, mask images, and requests must match.")
         batcher = InpaintingBatcher(max_batch_size=64)
+        image_paths = await asyncio.gather(*[save_image(image) for image in images])
+        mask_image_paths = await asyncio.gather(*[save_image(mask_image) for mask_image in mask_images])
+        results = await batcher.process_batch((image_paths, mask_image_paths, requests))
         return results
     except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))

ui/__pycache__/ui.cpython-311.pyc ADDED Viewed

Binary file (9.18 kB). View file

ui/ui.py CHANGED Viewed

@@ -1,16 +1,15 @@
 import gradio as gr
 import requests
-from pydantic import BaseModel
 from diffusers.utils import load_image
 from io import BytesIO
 sdxl_inference_endpoint = 'https://vikramsingh178-picpilot-server.hf.space/api/v1/product-diffusion/sdxl_v0_lora_inference'
 sdxl_batch_inference_endpoint = 'https://vikramsingh178-picpilot-server.hf.space/api/v1/product-diffusion/sdxl_v0_lora_inference/batch'
 kandinsky_inpainting_inference = 'https://vikramsingh178-picpilot-server.hf.space/api/v1/product-diffusion/inpainting'
-# Define the InpaintingRequest model
 class InputRequest(BaseModel):
     prompt: str
     num_inference_steps: int
@@ -20,15 +19,15 @@ class InputRequest(BaseModel):
     mode: str
 class InpaintingRequest(BaseModel):
-    prompt: str
-    negative_prompt: str
-    num_inference_steps: int
-    strength: float
-    guidance_scale: float
-    mode: str
 async def generate_sdxl_lora_image(prompt, negative_prompt, num_inference_steps, guidance_scale, num_images, mode):
-    # Prepare the payload for SDXL LORA API
     payload = InputRequest(
         prompt=prompt,
         negative_prompt=negative_prompt,
@@ -44,24 +43,46 @@ async def generate_sdxl_lora_image(prompt, negative_prompt, num_inference_steps,
     image = load_image(url)
     return image
-def generate_outpainting(prompt, negative_prompt, num_inference_steps, strength, guidance_scale, mode, image):
-    # Convert the image to bytes
     img_byte_arr = BytesIO()
-    image.save(img_byte_arr, format='PNG')
     img_byte_arr = img_byte_arr.getvalue()
     # Prepare the payload for multipart/form-data
     files = {
         'image': ('image.png', img_byte_arr, 'image/png'),
-        'prompt': (None, prompt),
-        'negative_prompt': (None, negative_prompt),
-        'num_inference_steps': (None, str(num_inference_steps)),
-        'strength': (None, str(strength)),
-        'guidance_scale': (None, str(guidance_scale)),
-        'mode': (None, mode)
     }
     response = requests.post(kandinsky_inpainting_inference, files=files)
     response.raise_for_status()
@@ -70,44 +91,39 @@ def generate_outpainting(prompt, negative_prompt, num_inference_steps, strength,
     image = load_image(url)
     return image
 with gr.Blocks(theme='VikramSingh178/Webui-Theme') as demo:
     with gr.Tab("SdxL-Lora"):
-       with gr.Row():
             with gr.Column():
-              with gr.Group():
-                prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here")
-                negative_prompt = gr.Textbox(label="Negative Prompt", placeholder="Enter negative prompt here")
-                num_inference_steps = gr.Slider(minimum=1, maximum=1000, step=1, value=20, label="Inference Steps")
-                guidance_scale = gr.Slider(minimum=1.0, maximum=10.0, step=0.1, value=7.5, label="Guidance Scale")
-                num_images = gr.Slider(minimum=1, maximum=10, step=1, value=1, label="Number of Images")
-                mode = gr.Dropdown(choices=["s3_json", "b64_json"], value="s3_json", label="Mode")
-                generate_button = gr.Button("Generate Image",variant='primary')
             with gr.Column(scale=1):
-                image_preview = gr.Image(label="Generated Image",show_download_button=True,show_share_button=True,container=True)
                 generate_button.click(generate_sdxl_lora_image, inputs=[prompt, negative_prompt, num_inference_steps, guidance_scale, num_images, mode], outputs=[image_preview])
-    with gr.Tab("Generate AI Background"):
         with gr.Row():
             with gr.Column():
-              with gr.Group():
-                image_input = gr.Image(type="pil", label="Upload Image")
-                prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here")
-                negative_prompt = gr.Textbox(label="Negative Prompt", placeholder="Enter negative prompt here")
-                num_inference_steps = gr.Slider(minimum=1, maximum=500, step=1, value=20, label="Inference Steps")
-                guidance_scale = gr.Slider(minimum=1.0, maximum=10.0, step=0.1, value=7.5, label="Guidance Scale")
-                strength = gr.Slider(minimum=0.1, maximum=1, step=0.1, value=1, label="Strength")
-                mode = gr.Dropdown(choices=["s3_json", "b64_json"], value="s3_json", label="Mode")
-                generate_button = gr.Button("Generate Background", variant='primary')
             with gr.Column(scale=1):
-                image_preview = gr.Image(label="Image", show_download_button=True, show_share_button=True, container=True)
-                generate_button.click(generate_outpainting, inputs=[prompt, negative_prompt, num_inference_steps, strength, guidance_scale, mode, image_input], outputs=[image_preview])
-demo.launch()

 import gradio as gr
 import requests
+from pydantic import BaseModel, Field
 from diffusers.utils import load_image
 from io import BytesIO
+import json
+import numpy as np
 sdxl_inference_endpoint = 'https://vikramsingh178-picpilot-server.hf.space/api/v1/product-diffusion/sdxl_v0_lora_inference'
 sdxl_batch_inference_endpoint = 'https://vikramsingh178-picpilot-server.hf.space/api/v1/product-diffusion/sdxl_v0_lora_inference/batch'
 kandinsky_inpainting_inference = 'https://vikramsingh178-picpilot-server.hf.space/api/v1/product-diffusion/inpainting'
 class InputRequest(BaseModel):
     prompt: str
     num_inference_steps: int
     mode: str
 class InpaintingRequest(BaseModel):
+    prompt: str = Field(..., description="Prompt text for inference")
+    negative_prompt: str = Field(..., description="Negative prompt text for inference")
+    num_inference_steps: int = Field(..., description="Number of inference steps")
+    strength: float = Field(..., description="Strength of the inference")
+    guidance_scale: float = Field(..., description="Guidance scale for inference")
+    mode: str = Field(..., description="Mode for output ('b64_json' or 's3_json')")
+    num_images: int = Field(..., description="Number of images to generate")
 async def generate_sdxl_lora_image(prompt, negative_prompt, num_inference_steps, guidance_scale, num_images, mode):
     payload = InputRequest(
         prompt=prompt,
         negative_prompt=negative_prompt,
     image = load_image(url)
     return image
+def process_masked_image(img):
+    base_image = img["image"]
+    mask = img["mask"]
+    # Convert mask to binary (0 or 255)
+    mask = np.where(mask > 0, 255, 0).astype(np.uint8)
+    return base_image, mask
+def generate_outpainting(prompt, negative_prompt, num_inference_steps, strength, guidance_scale, mode, num_images, masked_image):
+    base_image, mask = process_masked_image(masked_image)
+    # Convert the images to bytes
     img_byte_arr = BytesIO()
+    base_image.save(img_byte_arr, format='PNG')
     img_byte_arr = img_byte_arr.getvalue()
+    mask_byte_arr = BytesIO()
+    mask_image = gr.processing_utils.encode_pil_to_base64(mask)
+    mask_byte_arr = mask_image.getvalue()
     # Prepare the payload for multipart/form-data
     files = {
         'image': ('image.png', img_byte_arr, 'image/png'),
+        'mask_image': ('mask.png', mask_byte_arr, 'image/png'),
     }
+    # Prepare the request data
+    request_data = InpaintingRequest(
+        prompt=prompt,
+        negative_prompt=negative_prompt,
+        num_inference_steps=num_inference_steps,
+        strength=strength,
+        guidance_scale=guidance_scale,
+        mode=mode,
+        num_images=num_images
+    ).dict()
+    # Add the JSON-encoded request data to the files dictionary
+    files['request_data'] = ('request_data.json', json.dumps(request_data), 'application/json')
     response = requests.post(kandinsky_inpainting_inference, files=files)
     response.raise_for_status()
     image = load_image(url)
     return image
 with gr.Blocks(theme='VikramSingh178/Webui-Theme') as demo:
     with gr.Tab("SdxL-Lora"):
+        with gr.Row():
             with gr.Column():
+                with gr.Group():
+                    prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here")
+                    negative_prompt = gr.Textbox(label="Negative Prompt", placeholder="Enter negative prompt here")
+                    num_inference_steps = gr.Slider(minimum=1, maximum=1000, step=1, value=20, label="Inference Steps")
+                    guidance_scale = gr.Slider(minimum=1.0, maximum=10.0, step=0.1, value=7.5, label="Guidance Scale")
+                    num_images = gr.Slider(minimum=1, maximum=10, step=1, value=1, label="Number of Images")
+                    mode = gr.Dropdown(choices=["s3_json", "b64_json"], value="s3_json", label="Mode")
+                    generate_button = gr.Button("Generate Image", variant='primary')
             with gr.Column(scale=1):
+                image_preview = gr.Image(label="Generated Image", show_download_button=True, show_share_button=True, container=True)
                 generate_button.click(generate_sdxl_lora_image, inputs=[prompt, negative_prompt, num_inference_steps, guidance_scale, num_images, mode], outputs=[image_preview])
+    with gr.Tab("Inpainting"):
         with gr.Row():
             with gr.Column():
+                with gr.Group():
+                    masked_image = gr.ImageMask(label="Upload Image and Draw Mask")
+                    prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here")
+                    negative_prompt = gr.Textbox(label="Negative Prompt", placeholder="Enter negative prompt here")
+                    num_inference_steps = gr.Slider(minimum=1, maximum=100, step=1, value=20, label="Inference Steps")
+                    strength = gr.Slider(minimum=0.1, maximum=1, step=0.1, value=0.8, label="Strength")
+                    guidance_scale = gr.Slider(minimum=1.0, maximum=10.0, step=0.1, value=7.5, label="Guidance Scale")
+                    num_images = gr.Slider(minimum=1, maximum=10, step=1, value=1, label="Number of Images")
+                    mode = gr.Dropdown(choices=["s3_json", "b64_json"], value="s3_json", label="Mode")
+                    generate_button = gr.Button("Generate Inpainting", variant='primary')
             with gr.Column(scale=1):
+                image_preview = gr.Image(label="Inpainted Image", show_download_button=True, show_share_button=True, container=True)
+                generate_button.click(generate_outpainting, inputs=[prompt, negative_prompt, num_inference_steps, strength, guidance_scale, mode, num_images, masked_image], outputs=[image_preview])
+demo.launch()

ui/utils.py ADDED Viewed

	@@ -0,0 +1,27 @@

+from scripts.api_utils import ImageAugmentation
+from PIL import Image
+def augment_image(image_path, target_width, target_height, roi_scale, segmentation_model_name, detection_model_name):
+    """
+    Augment an image by extending its dimensions and generating masks.
+    Args:
+        image_path (str): Path to the image file.
+        target_width (int): Target width for augmentation.
+        target_height (int): Target height for augmentation.
+        roi_scale (float): Scale factor for region of interest.
+        segmentation_model_name (str): Name of the segmentation model.
+        detection_model_name (str): Name of the detection model.
+    Returns:
+        Tuple[Image.Image, Image.Image]: Augmented image and inverted mask.
+    """
+    image = Image.open(image_path)
+    image_augmentation = ImageAugmentation(target_width, target_height, roi_scale)
+    image = image_augmentation.extend_image(image)
+    mask = image_augmentation.generate_mask_from_bbox(image, segmentation_model_name, detection_model_name)
+    inverted_mask = image_augmentation.invert_mask(mask)
+    return image, inverted_mask