svjack committed (verified) · Commit abe5686 · Parent: 5c7858a

Upload 8 files

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+pexels-cottonbro-5319934.mp4 filter=lfs diff=lfs merge=lfs -text
300_A_car_is_running_on_the_road.mp4 ADDED
Binary file (186 kB).
 
A_Terracotta_Warrior_is_skateboarding_9033688.mp4 ADDED
Binary file (138 kB).
 
app.py ADDED
@@ -0,0 +1,151 @@
+import os
+import gradio as gr
+from gradio_imageslider import ImageSlider
+from loadimg import load_img
+import spaces
+from transformers import AutoModelForImageSegmentation
+import torch
+from torchvision import transforms
+from PIL import Image, ImageChops
+from moviepy.editor import VideoFileClip, ImageSequenceClip
+import numpy as np
+from tqdm import tqdm
+from uuid import uuid1
+
+# Check CUDA availability
+if torch.cuda.is_available():
+    device = "cuda"
+else:
+    device = "cpu"
+
+torch.set_float32_matmul_precision(["high", "highest"][0])
+
+# Load the model
+birefnet = AutoModelForImageSegmentation.from_pretrained(
+    "briaai/RMBG-2.0", trust_remote_code=True
+)
+birefnet.to(device)
+transform_image = transforms.Compose(
+    [
+        transforms.Resize((1024, 1024)),
+        transforms.ToTensor(),
+        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
+    ]
+)
+
+output_folder = 'output_images'
+if not os.path.exists(output_folder):
+    os.makedirs(output_folder)
+
+def fn(image):
+    im = load_img(image, output_type="pil")
+    im = im.convert("RGB")
+    origin = im.copy()
+    image = process(im)
+    image_path = os.path.join(output_folder, "no_bg_image.png")
+    image.save(image_path)
+    return (image, origin), image_path
+
+@spaces.GPU
+def process(image):
+    image_size = image.size
+    input_images = transform_image(image).unsqueeze(0).to(device)
+    # Prediction
+    with torch.no_grad():
+        preds = birefnet(input_images)[-1].sigmoid().cpu()
+    pred = preds[0].squeeze()
+    pred_pil = transforms.ToPILImage()(pred)
+    mask = pred_pil.resize(image_size)
+    image.putalpha(mask)
+    return image
+
+def process_file(f):
+    name_path = f.rsplit(".", 1)[0] + ".png"
+    im = load_img(f, output_type="pil")
+    im = im.convert("RGB")
+    transparent = process(im)
+    transparent.save(name_path)
+    return name_path
+
+def remove_background(image):
+    """Remove background from a single image."""
+    input_images = transform_image(image).unsqueeze(0).to(device)
+
+    # Prediction
+    with torch.no_grad():
+        preds = birefnet(input_images)[-1].sigmoid().cpu()
+    pred = preds[0].squeeze()
+
+    # Convert the prediction to a mask
+    mask = (pred * 255).byte()  # Convert to 0-255 range
+    mask_pil = transforms.ToPILImage()(mask).convert("L")
+    mask_resized = mask_pil.resize(image.size, Image.LANCZOS)
+
+    # Apply the mask to the image
+    image.putalpha(mask_resized)
+
+    return image, mask_resized
+
+def process_video(input_video_path):
+    """Process a video to remove the background from each frame."""
+    # Load the video
+    video_clip = VideoFileClip(input_video_path)
+
+    # Process each frame
+    frames = []
+    for frame in tqdm(video_clip.iter_frames()):
+        frame_pil = Image.fromarray(frame)
+        frame_no_bg, mask_resized = remove_background(frame_pil)
+        path = "{}.png".format(uuid1())
+        frame_no_bg.save(path)
+        frame_no_bg = Image.open(path).convert("RGBA")
+        os.remove(path)
+
+        # Convert mask_resized to RGBA mode
+        mask_resized_rgba = mask_resized.convert("RGBA")
+
+        # Apply the mask using ImageChops.multiply
+        output = ImageChops.multiply(frame_no_bg, mask_resized_rgba)
+        output_np = np.array(output)
+        frames.append(output_np)
+
+    # Save the processed frames as a new video
+    output_video_path = os.path.join(output_folder, "no_bg_video.mp4")
+    processed_clip = ImageSequenceClip(frames, fps=video_clip.fps)
+    processed_clip.write_videofile(output_video_path, codec='libx264', ffmpeg_params=['-pix_fmt', 'yuva420p'])
+
+    return output_video_path
+
+# Gradio components
+slider1 = ImageSlider(label="RMBG-2.0", type="pil")
+slider2 = ImageSlider(label="RMBG-2.0", type="pil")
+image = gr.Image(label="Upload an image")
+image2 = gr.Image(label="Upload an image", type="filepath")
+text = gr.Textbox(label="Paste an image URL")
+png_file = gr.File(label="output png file")
+video_input = gr.Video(label="Upload a video")
+video_output = gr.Video(label="Processed video")
+
+# Example videos
+example_videos = [
+    "pexels-cottonbro-5319934.mp4",
+    "300_A_car_is_running_on_the_road.mp4",
+    "A_Terracotta_Warrior_is_skateboarding_9033688.mp4"
+]
+
+# Gradio interfaces
+tab1 = gr.Interface(
+    fn, inputs=image, outputs=[slider1, gr.File(label="output png file")], examples=[load_img("giraffe.jpg", output_type="pil")], api_name="image"
+)
+
+tab2 = gr.Interface(fn, inputs=text, outputs=[slider2, gr.File(label="output png file")], examples=["http://farm9.staticflickr.com/8488/8228323072_76eeddfea3_z.jpg"], api_name="text")
+#tab3 = gr.Interface(process_file, inputs=image2, outputs=png_file, examples=["giraffe.jpg"], api_name="png")
+tab4 = gr.Interface(process_video, inputs=video_input, outputs=video_output, examples=example_videos, api_name="video")
+
+# Gradio tabbed interface
+demo = gr.TabbedInterface(
+    [tab4, tab1, tab2], ["input video", "input image", "input url"], title="RMBG-2.0 for background removal"
+)
+
+if __name__ == "__main__":
+    demo.launch(share=True, show_error=True)
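
Note: because app.py registers the video tab with api_name="video", the processing function should also be reachable programmatically once the demo is running. Below is a minimal sketch using gradio_client, which is not part of this commit's requirements.txt and would need to be installed separately; the client URL is a placeholder for wherever the demo is actually served.

# Hedged sketch: call the "/video" endpoint exposed by app.py via gradio_client.
# Assumes `pip install gradio_client` and a running instance at the placeholder URL below.
from gradio_client import Client, handle_file

client = Client("http://127.0.0.1:7860")  # placeholder; a Hub Space id such as "user/space" also works

result = client.predict(
    handle_file("300_A_car_is_running_on_the_road.mp4"),  # one of the example clips in this commit
    api_name="/video",
)
print(result)  # local path of the no_bg_video.mp4 produced by process_video

Older gradio_client releases accept a plain file path instead of handle_file(); the endpoint name follows from api_name="video" in app.py.
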
giraffe.jpg ADDED
image_app.py ADDED
@@ -0,0 +1,89 @@
+import os
+import gradio as gr
+from gradio_imageslider import ImageSlider
+from loadimg import load_img
+import spaces
+from transformers import AutoModelForImageSegmentation
+import torch
+from torchvision import transforms
+
+# Check whether CUDA is available
+if torch.cuda.is_available():
+    device = "cuda"
+else:
+    device = "cpu"
+
+torch.set_float32_matmul_precision(["high", "highest"][0])
+
+birefnet = AutoModelForImageSegmentation.from_pretrained(
+    "briaai/RMBG-2.0", trust_remote_code=True
+)
+birefnet.to(device)
+transform_image = transforms.Compose(
+    [
+        transforms.Resize((1024, 1024)),
+        transforms.ToTensor(),
+        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
+    ]
+)
+
+output_folder = 'output_images'
+if not os.path.exists(output_folder):
+    os.makedirs(output_folder)
+
+def fn(image):
+    im = load_img(image, output_type="pil")
+    im = im.convert("RGB")
+    origin = im.copy()
+    image = process(im)
+    image_path = os.path.join(output_folder, "no_bg_image.png")
+    image.save(image_path)
+    return (image, origin), image_path
+
+@spaces.GPU
+def process(image):
+    image_size = image.size
+    input_images = transform_image(image).unsqueeze(0).to(device)
+    # Prediction
+    with torch.no_grad():
+        preds = birefnet(input_images)[-1].sigmoid().cpu()
+    pred = preds[0].squeeze()
+    pred_pil = transforms.ToPILImage()(pred)
+    mask = pred_pil.resize(image_size)
+    image.putalpha(mask)
+    return image
+
+def process_file(f):
+    name_path = f.rsplit(".", 1)[0] + ".png"
+    im = load_img(f, output_type="pil")
+    im = im.convert("RGB")
+    transparent = process(im)
+    transparent.save(name_path)
+    return name_path
+
+slider1 = ImageSlider(label="RMBG-2.0", type="pil")
+slider2 = ImageSlider(label="RMBG-2.0", type="pil")
+image = gr.Image(label="Upload an image")
+image2 = gr.Image(label="Upload an image", type="filepath")
+text = gr.Textbox(label="Paste an image URL")
+png_file = gr.File(label="output png file")
+
+
+chameleon = load_img("giraffe.jpg", output_type="pil")
+
+url = "http://farm9.staticflickr.com/8488/8228323072_76eeddfea3_z.jpg"
+
+tab1 = gr.Interface(
+    fn, inputs=image, outputs=[slider1, gr.File(label="output png file")], examples=[chameleon], api_name="image"
+)
+
+tab2 = gr.Interface(fn, inputs=text, outputs=[slider2, gr.File(label="output png file")], examples=[url], api_name="text")
+tab3 = gr.Interface(process_file, inputs=image2, outputs=png_file, examples=["giraffe.jpg"], api_name="png")
+
+
+demo = gr.TabbedInterface(
+    [tab1, tab2], ["input image", "input url"], title="RMBG-2.0 for background removal"
+)
+
+if __name__ == "__main__":
+    demo.launch(share=True, show_error=True)
pexels-cottonbro-5319934.mp4 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:647dd65864fef5aee16a8033740771a1e0f0e49d51596a8d9d452dc0767cfd54
+size 22477729
requirements.txt ADDED
@@ -0,0 +1,19 @@
+torch
+accelerate
+opencv-python
+spaces
+pillow
+numpy
+timm
+kornia
+prettytable
+typing
+scikit-image
+#huggingface_hub
+transformers>=4.39.1
+gradio
+gradio_imageslider
+loadimg>=0.1.1
+httpx[socks]
+huggingface_hub==0.25.0
+moviepy
video_script.py ADDED
@@ -0,0 +1,78 @@
+from PIL import Image, ImageChops
+import torch
+from torchvision import transforms
+from transformers import AutoModelForImageSegmentation
+from moviepy.editor import VideoFileClip, ImageSequenceClip
+import numpy as np
+from tqdm import tqdm
+from uuid import uuid1
+import os
+
+# Load the model
+model = AutoModelForImageSegmentation.from_pretrained('briaai/RMBG-2.0', trust_remote_code=True)
+torch.set_float32_matmul_precision('high')  # Set precision
+model.to('cuda')
+model.eval()
+
+# Data settings
+image_size = (1024, 1024)
+transform_image = transforms.Compose([
+    transforms.Resize(image_size),
+    transforms.ToTensor(),
+    transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
+])
+
+def remove_background(image):
+    """Remove background from a single image."""
+    input_images = transform_image(image).unsqueeze(0).to('cuda')
+
+    # Prediction
+    with torch.no_grad():
+        preds = model(input_images)[-1].sigmoid().cpu()
+    pred = preds[0].squeeze()
+
+    # Convert the prediction to a mask
+    mask = (pred * 255).byte()  # Convert to 0-255 range
+    mask_pil = transforms.ToPILImage()(mask).convert("L")
+    mask_resized = mask_pil.resize(image.size, Image.LANCZOS)
+
+    # Apply the mask to the image
+    image.putalpha(mask_resized)
+
+    return image, mask_resized
+
+def process_video(input_video_path, output_video_path):
+    """Process a video to remove the background from each frame."""
+    # Load the video
+    video_clip = VideoFileClip(input_video_path)
+
+    # Process each frame
+    frames = []
+    for frame in tqdm(video_clip.iter_frames()):
+        frame_pil = Image.fromarray(frame)
+        frame_no_bg, mask_resized = remove_background(frame_pil)
+        path = "{}.png".format(uuid1())
+        frame_no_bg.save(path)
+        frame_no_bg = Image.open(path).convert("RGBA")
+        os.remove(path)
+
+        # Convert mask_resized to RGBA mode
+        mask_resized_rgba = mask_resized.convert("RGBA")
+
+        # Apply the mask using ImageChops.multiply
+        output = ImageChops.multiply(frame_no_bg, mask_resized_rgba)
+        output_np = np.array(output)
+        frames.append(output_np)
+
+    # Save the processed frames as a new video
+    processed_clip = ImageSequenceClip(frames, fps=video_clip.fps)
+    processed_clip.write_videofile(output_video_path, codec='libx264', ffmpeg_params=['-pix_fmt', 'yuva420p'])
+
+if __name__ == "__main__":
+    from IPython import display
+    # Example usage
+    input_video_path = "300_A_car_is_running_on_the_road.mp4"  # Replace with your video path
+    output_video_path = "300_A_car_is_running_on_the_road_no_bg.mp4"
+    process_video(input_video_path, output_video_path)
+    display.Video("300_A_car_is_running_on_the_road_no_bg.mp4")
+    pass
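
Note: the __main__ block above exercises the whole-video path; the same remove_background step can be checked on a single still image first, which is a quick way to judge mask quality before processing a full clip. A minimal sketch, assuming video_script.py has already been imported (so model and transform_image are loaded) and using a placeholder input file name:

# Hedged sketch: apply the per-frame step from video_script.py to one image.
# "example_frame.jpg" is a placeholder path, not a file in this commit.
from PIL import Image

frame = Image.open("example_frame.jpg").convert("RGB")
frame_no_bg, mask = remove_background(frame)  # RGBA image plus grayscale mask
frame_no_bg.save("example_frame_no_bg.png")   # PNG keeps the alpha channel
mask.save("example_frame_mask.png")
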