DesignEdit

Sleeping

jiayueru

update code

37ee4a4 7 months ago

14.2 kB

	import cv2
	from matplotlib import pyplot as plt
	import numpy as np
	import torch
	from PIL import Image, ImageDraw, ImageFont
	from datetime import datetime
	import os
	from typing import List, Dict

	def convert_and_resize_mask(mask):
	if mask.ndim == 3:
	mask = cv2.cvtColor(mask, cv2.COLOR_BGR2GRAY)
	resized_mask = cv2.resize(mask, (1024, 1024))
	return resized_mask

	def add_masks_resized(masks):
	final_mask = np.zeros((1024, 1024), dtype=np.uint8)
	for mask in masks:
	if mask is not None:
	resized_mask = convert_and_resize_mask(mask)
	resized_mask = resized_mask.astype(np.uint8)
	final_mask = cv2.add(final_mask, resized_mask)
	return final_mask

	def attend_mask(mask_file, attend_scale=10, save=False):
	if isinstance(mask_file, str):
	if mask_file == '':
	return torch.zeros([1, 1, 128, 128], dtype=torch.float32).cuda()
	else:
	image_with_mask = cv2.imread(mask_file, cv2.IMREAD_GRAYSCALE)
	elif len(mask_file.shape) == 3: # convert RGB to gray
	image_with_mask = cv2.cvtColor(mask_file, cv2.COLOR_BGR2GRAY)

	else:
	image_with_mask = mask_file

	if attend_scale != 0:
	kernel = np.ones((abs(attend_scale), abs(attend_scale)), np.uint8)
	if attend_scale > 0:
	image_with_mask = cv2.dilate(image_with_mask, kernel, iterations=1)
	else:
	image_with_mask = cv2.erode(image_with_mask, kernel, iterations=1)

	if save and isinstance(mask_file, str):
	new_mask_file_name = mask_file[:-4]+'_'+str(attend_scale)+'.jpg'
	cv2.imwrite(new_mask_file_name, image_with_mask)
	print("new_mask is saved in ", new_mask_file_name)

	dilated_image= cv2.resize(image_with_mask, (128, 128), interpolation=cv2.INTER_NEAREST)
	dilated_image = torch.from_numpy(dilated_image).to(torch.float32).unsqueeze(0).unsqueeze(0).cuda() / 255
	return dilated_image


	def panning(img_path=None, op_list=[['left', 0.2]], save=False, save_dir=None):
	if isinstance(img_path, str):
	img = cv2.imread(img_path)
	else:
	img = img_path
	img_new = img.copy()
	img_height, img_width, _ = img.shape
	w_mask = 255 * np.ones((img_height, img_width), dtype=np.uint8)
	h_mask = 255 * np.ones((img_height, img_width), dtype=np.uint8)

	for op in op_list:
	scale = op[1]
	if op[0] in ['right', 'left']:
	K = int(scale*img_width)
	elif op[0] in ['up', 'down']:
	K = int(scale*img_height)

	if op[0] == 'right':
	img_new[:, K:, :] = img[:, 0:img_width-K, :]
	w_mask[:, K:] = 0
	elif op[0] == 'left':
	img_new[:, 0:img_width-K, :] = img[:, K:, :]
	w_mask[:, 0:img_width-K] = 0
	elif op[0] == 'down':
	img_new[K:, :, :] = img[0:img_height-K, :, :]
	h_mask[K:, :] = 0
	elif op[0] == 'up':
	img_new[0:img_height-K, :, :] = img[K:, :, :]
	h_mask[0:img_height-K, :] = 0
	img = img_new

	mask = w_mask + h_mask
	mask[mask>0] = 255

	if save:
	if save_dir is None:
	base_dir = os.path.dirname(img_path)
	save_dir = os.path.join(base_dir, 'preprocess')
	elif not os.path.exists(save_dir):
	os.makedirs(save_dir)
	resized_img_name = f"{save_dir}/resized_image.png"
	resized_mask_name = f"{save_dir}/resized_mask.png"
	cv2.imwrite(resized_img_name, img_new)
	cv2.imwrite(resized_mask_name, mask)
	return resized_img_name, resized_mask_name
	else:
	return img_new, mask

	def zooming(img_path=None, scale=[0.8, 0.8], save=False, save_dir=None):
	if isinstance(img_path, str):
	img = cv2.imread(img_path)
	else:
	img = img_path
	img_new = img.copy()
	img_height, img_width, _ = img.shape
	mask = 255 * np.ones((img_height, img_width), dtype=np.uint8)

	new_height = int(img_height*scale[0])
	new_width = int(img_width*scale[1])
	resized_img = cv2.resize(img, (new_width, new_height), interpolation=cv2.INTER_AREA)
	x_offset = (img_width - new_width) // 2
	y_offset = (img_height - new_height) // 2

	img_new[y_offset:y_offset + new_height, x_offset:x_offset + new_width] = resized_img
	mask[y_offset:y_offset + new_height, x_offset:x_offset + new_width] = 0

	if save:
	if save_dir is None:
	base_dir = os.path.dirname(img_path)
	save_dir = os.path.join(base_dir, 'preprocess')
	elif not os.path.exists(save_dir):
	os.makedirs(save_dir)

	resized_img_name = f"{save_dir}/resized_image.png"
	resized_mask_name = f"{save_dir}/resized_mask.png"
	cv2.imwrite(resized_img_name, img_new)
	cv2.imwrite(resized_mask_name, mask)
	return resized_img_name, resized_mask_name
	else:
	return img_new, mask

	def get_box(mask, bias = 2):
	nonzero_indices = torch.nonzero(mask)
	H, W = mask.shape[-2:]
	min_x = max(min(nonzero_indices[:, 1]) - bias, 0)
	min_y = max(min(nonzero_indices[:, 0]) - bias, 0)
	max_x = min(max(nonzero_indices[:, 1]) + bias, W)
	max_y = min(max(nonzero_indices[:, 0]) + bias, H)
	return (min_x, min_y, max_x, max_y)


	def draw_axis(img,grid_dict,x_len,y_len):
	if grid_dict is not None and grid_dict is not False:
	assert isinstance(grid_dict,Dict)
	assert "x_title" in grid_dict
	assert "y_title" in grid_dict
	assert "x_text_list" in grid_dict
	assert "y_text_list" in grid_dict
	x_title=grid_dict["x_title"]
	y_title=grid_dict["y_title"]
	x_text_list=grid_dict['x_text_list']
	y_text_list=grid_dict['y_text_list']
	assert len(y_text_list)==y_len
	assert len(x_text_list)==x_len
	assert "font_size" in grid_dict
	font_size=grid_dict["font_size"]
	if "x_color" in grid_dict:
	color_x=grid_dict['x_color']
	else:
	color_x="black"
	if "y_color" in grid_dict:
	color_y=grid_dict['y_color']
	else:
	color_y="black"
	if "num_decimals" in grid_dict:
	num_decimals=grid_dict['num_decimals']
	else:
	num_decimals=2
	if "shift_x" in grid_dict:
	shift_x_x,shift_x_y=grid_dict['shift_x']
	else:
	shift_x_x=shift_x_y=0
	if "shift_y" in grid_dict:
	shift_y_x,shift_y_y=grid_dict['shift_y']
	else:
	shift_y_x=shift_y_y=0
	if "title" in grid_dict:
	title=grid_dict['title']
	if isinstance(title,List):
	all_title=""
	for s in title:
	all_title=all_title+s+"\n"
	title=all_title
	else:
	title=''
	width, height = img.size
	num_x=x_len
	num_y=y_len

	new_img = Image.new("RGB", (width + width // num_x+width // (num_x2), height + height // num_y+height // (num_y2)), color=(255, 255, 255))
	width,height=(width + width // num_x, height + height // num_y)
	num_x=num_x+1
	num_y=num_y+1
	new_img.paste(img, (width // num_x, height // num_y))

	draw = ImageDraw.Draw(new_img)

	font = ImageFont.truetype("DejaVuSansMono.ttf", font_size)
	for i in range(2, num_x+1):
	x = (i - 1) * width // num_x + width // (num_x * 2)-width *0.2// num_x+shift_x_x
	y = height // (num_y * 2)+shift_x_y
	k=i-1
	if isinstance(x_text_list[i-2],str):
	draw.text((x, y), x_text_list[i-2], font=font,fill=color_x,align="center")
	else:
	draw.text((x, y), "{:.{}f}".format(x_text_list[i-2],num_decimals), font=font,fill=color_x,align="center")

	for i in range(2, num_y+1):
	x = width // (num_x * 2)-width *0.1// num_x+shift_y_x
	y = (i - 1) * height // num_y + height // (num_y * 2)-height*0.1//num_y+shift_y_y
	k = i - 1
	if isinstance(y_text_list[i-2],str):
	draw.text((x, y), y_text_list[i-2], font=font,fill=color_y,align="center")
	else:
	draw.text((x, y), "{:.{}f}".format(y_text_list[i-2],num_decimals), font=font,fill=color_y,align="center")
	i=1
	x = (i - 1) * width // num_x + width // (num_x * 2)-height*0.1//num_y+shift_y_x
	y = height // (num_y * 2)+width *0.2// num_x+shift_y_y
	draw.text((x, y), y_title, font=font, fill=color_y,align="center")
	x = width // (num_x * 2)+width *0.2// num_x+shift_x_x
	y = (i - 1) * height // num_y + height // (num_y * 2)+shift_x_y
	draw.text((x, y), x_title, font=font, fill=color_x,align="left")
	x = width // 4
	y = (i - 1) * height // num_y + height // (num_y * 10)
	draw.text((x, y), title, font=font, fill='blue',align="left")
	else:

	new_img=img
	return new_img

	def view_images(images, num_rows=1, offset_ratio=0.02,text="",folder=None,Notimestamp=False,
	grid_dict=None,subfolder=None,verbose=True,output_dir=None,timestamp=None,**kwargs):
	if type(images) is list:
	num_empty = len(images) % num_rows
	elif images.ndim == 4:
	num_empty = images.shape[0] % num_rows
	else:
	images = [images]
	num_empty = 0
	origin_size=kwargs.get("origin_size",None)
	images_copy=images.copy()
	for i, per_image in enumerate(images_copy):
	if isinstance(per_image, Image.Image) and origin_size is not None:
	images[i] = np.array(per_image.resize((origin_size[1],origin_size[0])))
	else:
	images[i] = np.array(per_image)

	empty_images = np.ones(images[0].shape, dtype=np.uint8) * 255
	images = [image.astype(np.uint8) for image in images] + [empty_images] * num_empty
	num_items = len(images)

	h, w, c = images[0].shape
	offset = int(h * offset_ratio)
	num_cols = num_items // num_rows
	image_ = np.ones((h * num_rows + offset * (num_rows - 1),
	w * num_cols + offset * (num_cols - 1), 3), dtype=np.uint8) * 255
	for i in range(num_rows):
	for j in range(num_cols):
	image_[i * (h + offset): i * (h + offset) + h:, j * (w + offset): j * (w + offset) + w] = images[
	i * num_cols + j]

	pil_img = Image.fromarray(image_)

	pil_img_=draw_axis(pil_img,grid_dict,num_cols,num_rows)
	if pil_img_.size[0]==pil_img_.size[1]:
	pil_img_.resize((2048,2048))
	else:
	longer_side = max(pil_img.size)
	ratio = 2048/longer_side
	new_size = tuple([int(x*ratio) for x in pil_img.size])
	pil_img = pil_img.resize(new_size)

	if verbose is False:
	return pil_img
	now = datetime.now()
	if timestamp is None:
	if Notimestamp is False:
	timestamp = now.strftime("%Y-%m-%d_%H-%M-%S")
	else:
	timestamp=""
	if output_dir is None:
	if timestamp != "":
	date, time = timestamp.split('_')
	else:
	date, time = "",""
	if folder is not None:
	dirname="./"+folder
	filename = text+f"img_{timestamp}.jpg"
	else:
	if subfolder is not None:
	dirname=os.path.join("./img", subfolder,date)
	dirname=os.path.join(dirname,time)
	filename =text+f"img_{timestamp}.jpg"
	else:
	dirname=os.path.join("./img",date)
	dirname=os.path.join(dirname,time)
	filename =text+f"img_{timestamp}.jpg"
	else:
	dirname=output_dir
	filename =text+f"img_{timestamp}.jpg"
	if not os.path.exists(dirname):
	os.makedirs(dirname)
	if verbose is True:
	for i, img in enumerate(images):
	im = Image.fromarray(img)
	im.save(os.path.join(dirname,f"{i}.jpg"))
	print(f"Output dir: {dirname}")
	pil_img.save(os.path.join(dirname, filename))
	if grid_dict is not None and grid_dict is not False:
	if not os.path.exists(dirname):
	os.makedirs(dirname)
	pil_img_.save(os.path.join(dirname, filename[:-4]+"_2048x.jpg"))

	def resize_image_with_mask(img, mask, scale):
	if scale == 1:
	return img, mask, None
	img_blackboard = img.copy() # canvas
	mask_blackboard = np.zeros_like(mask)

	M = cv2.moments(mask)
	cx = int(M["m10"] / M["m00"])
	cy = int(M["m01"] / M["m00"])

	scale_factor = [scale, scale]
	resized_img = cv2.resize(img, None, fx=scale_factor[0], fy=scale_factor[1], interpolation=cv2.INTER_AREA)
	resized_mask = cv2.resize(mask, None, fx=scale_factor[0], fy=scale_factor[1], interpolation=cv2.INTER_AREA)
	new_cx, new_cy = cx * scale_factor[0], cy * scale_factor[1]

	for y in range(resized_mask.shape[0]):
	for x in range(resized_mask.shape[1]):
	if 0 <= cy - (new_cy - y) < img.shape[0] and 0 <= cx - (new_cx - x) < img.shape[1]:
	mask_blackboard[int(cy - (new_cy - y)), int(cx - (new_cx - x))] = resized_mask[y, x]
	img_blackboard[int(cy - (new_cy - y)), int(cx - (new_cx - x))] = resized_img[y, x]
	return img_blackboard, mask_blackboard, (cx, cy)

	def flip_image_with_mask(img, mask, flip_code=None):
	if flip_code is None:
	return img, mask, None
	M = cv2.moments(mask)
	if M["m00"] == 0:
	return img, mask
	cx = int(M["m10"] / M["m00"])
	cy = int(M["m01"] / M["m00"])

	h, w = img.shape[:2]
	img_center = (w // 2, h // 2)

	tx = img_center[0] - cx
	ty = img_center[1] - cy

	M_translate = np.float32([[1, 0, tx], [0, 1, ty]])
	img_translated = cv2.warpAffine(img, M_translate, (w, h))
	mask_translated = cv2.warpAffine(mask, M_translate, (w, h))
	flipped_img = cv2.flip(img_translated, flip_code)
	flipped_mask = cv2.flip(mask_translated, flip_code)
	M_translate_back = np.float32([[1, 0, -tx], [0, 1, -ty]])
	flipped_img_back = cv2.warpAffine(flipped_img, M_translate_back, (w, h))
	flipped_mask_back = cv2.warpAffine(flipped_mask, M_translate_back, (w, h))

	return flipped_img_back, flipped_mask_back, (cx, cy)