Spaces:

Mrmusculo
/

background

Runtime error

App Files Files Community

Mrmusculo commited on Aug 7, 2023

Commit

3a0bfe5

•

1 Parent(s): 08c4f37

Create app.py

Browse files

Files changed (1) hide show

app.py +220 -0

app.py ADDED Viewed

	@@ -0,0 +1,220 @@

+import pickle
+import pandas as pd
+import numpy as np
+import requests
+import io
+import os
+import cv2
+import gdown
+import tempfile
+from PIL import Image, ImageDraw, ImageFont
+import PIL
+from transparent_background import Remover
+import torch
+import time
+import gradio as gr
+from PIL import Image
+import requests
+from io import BytesIO
+class BackgroundRemover(Remover):
+    def __init__(self, model_bytes, device=None):
+        """
+        model_bytes: model weights as bytes (downloaded from "https://drive.google.com/file/d/13oBl5MTVcWER3YU4fSxW3ATlVfueFQPY/view?usp=share_link")
+        device     : (default cuda:0 if available) specifying device for computation
+        """
+        self.model_path = None
+        with tempfile.NamedTemporaryFile(suffix=".pth", delete=False) as tmp_file:
+            tmp_file.write(model_bytes)
+            self.model_path = tmp_file.name
+        # get the path of the script that defines this class
+        script_path = os.path.abspath(__file__)
+        # construct the path to the arial.ttf file relative to the script location
+        font_path = os.path.join(os.path.dirname(script_path), "arial.ttf")
+        self.font_path = font_path
+        super().__init__(fast=False, jit=False, device=device, ckpt=self.model_path)
+    def __del__(self):
+        if self.model_path is not None and os.path.exists(self.model_path):
+            os.remove(self.model_path)
+    def download(self):
+        pass
+    def predict(self, image, comparison=False, extra=""):
+        s = time.time()
+        prediction = self.raw_predict(image)
+        e = time.time()
+        #print(f"predict time {e-s:.4f}")
+        if not comparison:
+            return prediction
+        else:
+            return self.compare(image, prediction, e-s, extra)
+    def raw_predict(self, image, empty_cache_after_prediction=False):
+        t1 = time.time()
+        out = self.process(image)
+        t2 = time.time()
+        prediction = Image.fromarray(out)
+        # Crea una nueva imagen RGB con un fondo blanco del mismo tamaño que la original
+        new_image = Image.new("RGB", prediction.size, (255, 255, 255))
+        # Combina las dos imágenes, reemplazando los píxeles transparentes con blanco
+        new_image.paste(prediction, mask=prediction.split()[3])
+        t3 = time.time()
+        if empty_cache_after_prediction and "cuda" in self.device:
+            torch.cuda.empty_cache()
+        t4 = time.time()
+        #print(f"{(t2-t1)*1000:.4f} {(t3-t2)*1000:.4f} {(t4-t3)*1000:.4f}")
+        return new_image
+    def compare(self, image1, image2, prediction_time, extra_info=""):
+        extra = 80
+        concatenated_image = Image.new('RGB', (image1.width + image2.width, image1.height + extra), (255, 255, 255))
+        concatenated_image.paste(image1, (0, 0+extra))
+        concatenated_image.paste(image2, (image1.width, 0+extra))
+        draw = ImageDraw.Draw(concatenated_image)
+        font = ImageFont.truetype(self.font_path, 20)
+        draw.text((20, 0), f"size:{image1.size}\nmodel time:{prediction_time:.2f}s\n{extra_info}", fill=(0, 0, 0), font=font)
+        return concatenated_image
+    def read_image_from_url(self, url):
+        response = requests.get(url)
+        image = Image.open(io.BytesIO(response.content)).convert("RGB")
+        return image
+    def read_image_from_file(self, file_name):
+        image = Image.open(file_name).convert("RGB")
+        return image
+    def read_image_form_bytes(self, image_bytes):
+        # Convertir los bytes en imagen
+        image = Image.open(io.BytesIO(image_bytes))
+        return image
+    def image_to_bytes(self, image, format="JPEG"):
+        image_bytes = io.BytesIO()
+        image_rgb = image.convert('RGB')
+        image_rgb.save(image_bytes, format=format)
+        image_bytes = image_bytes.getvalue()
+        return image_bytes
+    @classmethod
+    def create_instance_from_model_url(cls, url):
+        model_bytes = BackgroundRemover.download_model_from_url(url)
+        return cls(model_bytes)
+    @classmethod
+    def create_instance_from_model_file(cls, file_path, device=None):
+        with open(file_path, 'rb') as f:
+            model_bytes = f.read()
+        return cls(model_bytes, device)
+    @classmethod
+    def download_model_from_url(cls, url):
+        with io.BytesIO() as file:
+            gdown.download(url, file, quiet=False, fuzzy=True)
+            # Get the contents of the file as bytes
+            file.seek(0)
+            model_bytes = file.read()
+        return model_bytes
+def show_image(url: str):
+    response = requests.get(url)
+    img = Image.open(BytesIO(response.content))
+    return img
+def do_predictions(url):
+    response = requests.get(url)
+    img = Image.open(BytesIO(response.content))
+    device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+    transform_model = BackgroundRemover.create_instance_from_model_file("model_weights.pth")
+    # Set up data transformations
+    data_transforms = {
+        'train': transforms.Compose([
+            #transforms.Resize(512), #256
+            #transforms.CenterCrop(480), # 224
+            #transforms.Resize((256, 256)),
+            transforms.Resize((384, 384)),
+            transforms.ToTensor(),
+            transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
+        ]),
+        'val': transforms.Compose([
+            #transforms.Resize(512), #256
+            #transforms.CenterCrop(480), # 224
+            #transforms.Resize((256, 256)),
+            transforms.Resize((384, 284)),
+            transforms.ToTensor(),
+            transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
+        ]),
+    }
+    # Crear un modelo con la misma arquitectura
+    detect_model = models.resnet50(weights=None)  # Cambiar 'pretrained' por 'weights'
+    num_ftrs = detect_model.fc.in_features
+    num_classes = 2
+    detect_model.fc = nn.Linear(num_ftrs, num_classes)
+    detect_model = detect_model.to(device)
+    # Cargar los pesos guardados
+    model_weights_path = 'white_background_detection/resnet50_finetuned_weights.pth'
+    detect_model.load_state_dict(torch.load(model_weights_path))
+    # Cambiar el modelo a modo de evaluación
+    detect_model.eval()
+    print("")
+    prediction, predicted_probability, inference_time = predict_single_image_detection(img, detect_model, data_transforms['val'], "cuda:0")
+    if prediction=="real":
+        out = transform_model.predict(img, comparison=False)
+        return prediction, predicted_probability, img, out,
+    else:
+        return prediction, predicted_probability, img, None
+iface = gr.Interface(fn=do_predictions, inputs="text", outputs=["text", "text", "image", "image"], examples=[["https://http2.mlstatic.com/D_NQ_NP_2X_823376-MLU29226703936_012019-F.webp"],
+                                                                                                             ["https://http2.mlstatic.com/D_781350-MLA53584851929_022023-F.jpg"]])
+#iface.outputs[0].set_title("Predicción")
+#iface.outputs[1].set_title("Clase")
+#iface.outputs[2].set_title("Probabilidad")
+iface.launch(share=True)