Spaces:
Running
on
L40S
Running
on
L40S
File size: 3,294 Bytes
e3e5f9e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 |
import os, sys
sys.path.insert(0, f"{os.path.dirname(os.path.dirname(os.path.abspath(__file__)))}")
import numpy as np
from PIL import Image
from rembg import remove, new_session
from infer.utils import timing_decorator
class Removebg():
def __init__(self, name="u2net"):
self.session = new_session(name)
@timing_decorator("remove background")
def __call__(self, rgb_maybe, force=True):
'''
args:
rgb_maybe: PIL.Image, with RGB mode or RGBA mode
force: bool, if input is RGBA mode, covert to RGB then remove bg
return:
rgba_img: PIL.Image, with RGBA mode
'''
if rgb_maybe.mode == "RGBA":
if force:
rgb_maybe = rgb_maybe.convert("RGB")
rgba_img = remove(rgb_maybe, session=self.session)
else:
rgba_img = rgb_maybe
else:
rgba_img = remove(rgb_maybe, session=self.session)
rgba_img = white_out_background(rgba_img)
rgba_img = preprocess(rgba_img)
return rgba_img
def white_out_background(pil_img):
data = pil_img.getdata()
new_data = []
for r, g, b, a in data:
if a < 16: # background
new_data.append((255, 255, 255, 0)) # full white color
else:
is_white = (r>235) and (g>235) and (b>235)
new_r = 235 if is_white else r
new_g = 235 if is_white else g
new_b = 235 if is_white else b
new_data.append((new_r, new_g, new_b, a))
pil_img.putdata(new_data)
return pil_img
def preprocess(rgba_img, size=(512,512), ratio=1.15):
image = np.asarray(rgba_img)
rgb, alpha = image[:,:,:3] / 255., image[:,:,3:] / 255.
# crop
coords = np.nonzero(alpha > 0.1)
x_min, x_max = coords[0].min(), coords[0].max()
y_min, y_max = coords[1].min(), coords[1].max()
rgb = (rgb[x_min:x_max, y_min:y_max, :] * 255).astype("uint8")
alpha = (alpha[x_min:x_max, y_min:y_max, 0] * 255).astype("uint8")
# padding
h, w = rgb.shape[:2]
resize_side = int(max(h, w) * ratio)
pad_h, pad_w = resize_side - h, resize_side - w
start_h, start_w = pad_h // 2, pad_w // 2
new_rgb = np.ones((resize_side, resize_side, 3), dtype=np.uint8) * 255
new_alpha = np.zeros((resize_side, resize_side), dtype=np.uint8)
new_rgb[start_h:start_h + h, start_w:start_w + w] = rgb
new_alpha[start_h:start_h + h, start_w:start_w + w] = alpha
rgba_array = np.concatenate((new_rgb, new_alpha[:,:,None]), axis=-1)
rgba_image = Image.fromarray(rgba_array, 'RGBA')
rgba_image = rgba_image.resize(size)
return rgba_image
if __name__ == "__main__":
import argparse
def get_args():
parser = argparse.ArgumentParser()
parser.add_argument("--rgb_path", type=str, required=True)
parser.add_argument("--output_rgba_path", type=str, required=True)
parser.add_argument("--force", default=False, action="store_true")
return parser.parse_args()
args = get_args()
rgb_maybe = Image.open(args.rgb_path)
model = Removebg()
rgba_pil = model(rgb_maybe, args.force)
rgba_pil.save(args.output_rgba_path)
|