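"""Renderers for SMPL/SMPL-X body meshes.

Provides three back-ends:
  * PyRenderer    -- pyrender-based RGB(A) overlay rendering.
  * OpenDRenderer -- OpenDR-based colored mesh rendering.
  * IUV_Renderer  -- PyTorch3D-based IUV / part-segmentation / PNCC rendering.
"""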
import os
# os.environ['PYOPENGL_PLATFORM'] = 'osmesa'
import json
import math
import torch
import trimesh
import numpy as np
# import neural_renderer as nr
from skimage.transform import resize
import torch.nn.functional as F
from models.smpl import get_smpl_faces, get_model_faces, get_model_tpose
from utils.densepose_methods import DensePoseMethods
from core import constants, path_config
from .geometry import convert_to_full_img_cam
from utils.imutils import crop
try:
    import pyrender
    from pyrender.constants import RenderFlags
except ImportError:
    pass

try:
    from opendr.renderer import ColoredRenderer
    from opendr.lighting import LambertianPointLight
    from opendr.camera import ProjectPoints
except ImportError:
    pass
from pytorch3d.structures.meshes import Meshes
# from pytorch3d.renderer.mesh.renderer import MeshRendererWithFragments
from pytorch3d.renderer import (
    PerspectiveCameras, AmbientLights, RasterizationSettings, BlendParams,
    MeshRenderer, MeshRasterizer, HardFlatShader, TexturesVertex
)

import logging
logger = logging.getLogger(__name__)
class WeakPerspectiveCamera(pyrender.Camera):
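    """Weak-perspective (scaled orthographic) camera for pyrender.

    `scale` and `translation` are the weak-perspective camera parameters;
    the projection matrix is built directly from them.
    """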
    def __init__(
        self, scale, translation, znear=pyrender.camera.DEFAULT_Z_NEAR, zfar=None, name=None
    ):
        super().__init__(
            znear=znear,
            zfar=zfar,
            name=name,
        )
        self.scale = scale
        self.translation = translation

    def get_projection_matrix(self, width=None, height=None):
        P = np.eye(4)
        P[0, 0] = self.scale[0]
        P[1, 1] = self.scale[1]
        P[0, 3] = self.translation[0] * self.scale[0]
        P[1, 3] = -self.translation[1] * self.scale[1]
        P[2, 2] = -1
        return P
class PyRenderer:
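    """Render a body mesh on top of an image with pyrender.

    Builds an offscreen pyrender scene with a fixed set of point and spot
    lights; each __call__ adds the mesh and a camera, renders, composites
    the result over the input image(s), and removes the added nodes again.
    """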
    def __init__(
        self, resolution=(224, 224), orig_img=False, wireframe=False, scale_ratio=1., vis_ratio=1.
    ):
        self.resolution = (resolution[0] * scale_ratio, resolution[1] * scale_ratio)
        self.faces = {
            'smplx': get_model_faces('smplx'),
            'smpl': get_model_faces('smpl'),
            # 'mano': get_model_faces('mano'),
            # 'flame': get_model_faces('flame'),
        }
        self.orig_img = orig_img
        self.wireframe = wireframe
        self.renderer = pyrender.OffscreenRenderer(
            viewport_width=self.resolution[0], viewport_height=self.resolution[1], point_size=1.0
        )
        self.vis_ratio = vis_ratio

        # set the scene
        self.scene = pyrender.Scene(bg_color=[0.0, 0.0, 0.0, 0.0], ambient_light=(0.3, 0.3, 0.3))

        light = pyrender.PointLight(color=np.array([1.0, 1.0, 1.0]) * 0.2, intensity=1)
        light_pose = np.eye(4)
        light_pose[:3, 3] = [0, -1, 1]
        self.scene.add(light, pose=light_pose)
        light_pose[:3, 3] = [0, 1, 1]
        self.scene.add(light, pose=light_pose)
        light_pose[:3, 3] = [1, 1, 2]
        self.scene.add(light, pose=light_pose)

        spot_l = pyrender.SpotLight(
            color=np.ones(3), intensity=15.0, innerConeAngle=np.pi / 3, outerConeAngle=np.pi / 2
        )
        light_pose[:3, 3] = [1, 2, 2]
        self.scene.add(spot_l, pose=light_pose)
        light_pose[:3, 3] = [-1, 2, 2]
        self.scene.add(spot_l, pose=light_pose)

        self.colors_dict = {
            'red': np.array([0.5, 0.2, 0.2]),
            'pink': np.array([0.7, 0.5, 0.5]),
            'neutral': np.array([0.7, 0.7, 0.6]),
            'purple': np.array([0.55, 0.4, 0.9]),
            'green': np.array([0.5, 0.55, 0.3]),
            'sky': np.array([0.3, 0.5, 0.55]),
            'white': np.array([1.0, 0.98, 0.94]),
        }
    def __call__(
        self,
        verts,
        faces=None,
        img=np.zeros((224, 224, 3)),
        cam=np.array([1, 0, 0]),
        focal_length=[5000, 5000],
        camera_rotation=np.eye(3),
        crop_info=None,
        angle=None,
        axis=None,
        mesh_filename=None,
        color_type=None,
        color=[1.0, 1.0, 0.9],
        iwp_mode=True,
        crop_img=True,
        mesh_type='smpl',
        scale_ratio=1.,
        rgba_mode=False
    ):
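        """Render `verts` over `img` and return the composited image(s).

        verts: (V, 3) vertex array.
        faces: (F, 3) face array; defaults to the faces of `mesh_type`.
        img: background image (or list of images), range [0, 255].
        cam: weak-perspective camera, either [s, tx, ty] or [sx, sy, tx, ty].
        iwp_mode: identity-rotation weak-perspective mode; if False,
            `crop_info` is used to recover the full-image camera.
        Returns the rendered overlay(s) as uint8, RGB or RGBA (`rgba_mode`).
        """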
        if faces is None:
            faces = self.faces[mesh_type]
        mesh = trimesh.Trimesh(vertices=verts, faces=faces, process=False)

        Rx = trimesh.transformations.rotation_matrix(math.radians(180), [1, 0, 0])
        mesh.apply_transform(Rx)

        if mesh_filename is not None:
            mesh.export(mesh_filename)

        if angle is not None and axis is not None:
            R = trimesh.transformations.rotation_matrix(math.radians(angle), axis)
            mesh.apply_transform(R)

        cam = cam.copy()
        if iwp_mode:
            resolution = np.array(img.shape[:2]) * scale_ratio
            if len(cam) == 4:
                sx, sy, tx, ty = cam
                camera_translation = np.array(
                    [tx, ty, 2 * focal_length[0] / (resolution[0] * sy + 1e-9)]
                )
            elif len(cam) == 3:
                sx, tx, ty = cam
                sy = sx
                camera_translation = np.array(
                    [-tx, ty, 2 * focal_length[0] / (resolution[0] * sy + 1e-9)]
                )
            render_res = resolution
            self.renderer.viewport_width = render_res[1]
            self.renderer.viewport_height = render_res[0]
        else:
            if crop_info['opt_cam_t'] is None:
                camera_translation = convert_to_full_img_cam(
                    pare_cam=cam[None],
                    bbox_height=crop_info['bbox_scale'] * 200.,
                    bbox_center=crop_info['bbox_center'],
                    img_w=crop_info['img_w'],
                    img_h=crop_info['img_h'],
                    focal_length=focal_length[0],
                )
            else:
                camera_translation = crop_info['opt_cam_t']
            if torch.is_tensor(camera_translation):
                camera_translation = camera_translation[0].cpu().numpy()
            camera_translation = camera_translation.copy()
            camera_translation[0] *= -1
            if 'img_h' in crop_info and 'img_w' in crop_info:
                render_res = (int(crop_info['img_h'][0]), int(crop_info['img_w'][0]))
            else:
                render_res = img.shape[:2] if not isinstance(img, list) else img[0].shape[:2]
            self.renderer.viewport_width = render_res[1]
            self.renderer.viewport_height = render_res[0]

        camera_rotation = camera_rotation.T
        camera = pyrender.IntrinsicsCamera(
            fx=focal_length[0], fy=focal_length[1], cx=render_res[1] / 2., cy=render_res[0] / 2.
        )

        if color_type is not None:
            color = self.colors_dict[color_type]
        material = pyrender.MetallicRoughnessMaterial(
            metallicFactor=0.2,
            roughnessFactor=0.6,
            alphaMode='OPAQUE',
            baseColorFactor=(color[0], color[1], color[2], 1.0)
        )
        mesh = pyrender.Mesh.from_trimesh(mesh, material=material)
        mesh_node = self.scene.add(mesh, 'mesh')

        camera_pose = np.eye(4)
        camera_pose[:3, :3] = camera_rotation
        camera_pose[:3, 3] = camera_rotation @ camera_translation
        cam_node = self.scene.add(camera, pose=camera_pose)

        if self.wireframe:
            render_flags = RenderFlags.RGBA | RenderFlags.ALL_WIREFRAME | RenderFlags.SHADOWS_SPOT
        else:
            render_flags = RenderFlags.RGBA | RenderFlags.SHADOWS_SPOT

        rgb, _ = self.renderer.render(self.scene, flags=render_flags)
        if crop_info is not None and crop_img:
            crop_res = img.shape[:2]
            rgb, _, _ = crop(rgb, crop_info['bbox_center'][0], crop_info['bbox_scale'][0], crop_res)
        valid_mask = (rgb[:, :, -1] > 0)[:, :, np.newaxis]

        image_list = [img] if not isinstance(img, list) else img
        return_img = []
        for item in image_list:
            if scale_ratio != 1:
                orig_size = item.shape[:2]
                item = resize(
                    item, (orig_size[0] * scale_ratio, orig_size[1] * scale_ratio),
                    anti_aliasing=True
                )
                item = (item * 255).astype(np.uint8)
            output_img = rgb[:, :, :-1] * valid_mask * self.vis_ratio + (
                1 - valid_mask * self.vis_ratio
            ) * item
            if rgba_mode:
                output_img_rgba = np.zeros((output_img.shape[0], output_img.shape[1], 4))
                output_img_rgba[:, :, :3] = output_img
                output_img_rgba[:, :, 3][valid_mask[:, :, 0]] = 255
                output_img = output_img_rgba.astype(np.uint8)
            image = output_img.astype(np.uint8)
            return_img.append(image)
            return_img.append(item)
        if not isinstance(img, list):
            return_img = return_img[0]

        self.scene.remove_node(mesh_node)
        self.scene.remove_node(cam_node)

        return return_img
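
# A minimal usage sketch (illustrative only; assumes `verts` is a (6890, 3)
# SMPL vertex array and `image` an HxWx3 uint8 frame loaded elsewhere):
#
#     renderer = PyRenderer(resolution=(224, 224))
#     overlay = renderer(verts, img=image, cam=np.array([0.9, 0., 0.]),
#                        color_type='purple', mesh_type='smpl')
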
class OpenDRenderer:
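    """Render a body mesh with OpenDR's ColoredRenderer.

    Lights the mesh with three Lambertian point lights and projects it with
    a perspective ProjectPoints camera derived from weak-perspective params.
    """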
    def __init__(self, resolution=(224, 224), ratio=1):
        self.resolution = (resolution[0] * ratio, resolution[1] * ratio)
        self.ratio = ratio
        self.focal_length = 5000.
        self.K = np.array(
            [
                [self.focal_length, 0., self.resolution[1] / 2.],
                [0., self.focal_length, self.resolution[0] / 2.],
                [0., 0., 1.]
            ]
        )
        self.colors_dict = {
            'red': np.array([0.5, 0.2, 0.2]),
            'pink': np.array([0.7, 0.5, 0.5]),
            'neutral': np.array([0.7, 0.7, 0.6]),
            'purple': np.array([0.5, 0.5, 0.7]),
            'green': np.array([0.5, 0.55, 0.3]),
            'sky': np.array([0.3, 0.5, 0.55]),
            'white': np.array([1.0, 0.98, 0.94]),
        }
        self.renderer = ColoredRenderer()
        self.faces = get_smpl_faces()
    def reset_res(self, resolution):
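        """Update the render resolution and rebuild the intrinsics K to match."""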
        self.resolution = (resolution[0] * self.ratio, resolution[1] * self.ratio)
        self.K = np.array(
            [
                [self.focal_length, 0., self.resolution[1] / 2.],
                [0., self.focal_length, self.resolution[0] / 2.],
                [0., 0., 1.]
            ]
        )
    def __call__(
        self,
        verts,
        faces=None,
        color=None,
        color_type='white',
        R=None,
        mesh_filename=None,
        img=np.zeros((224, 224, 3)),
        cam=np.array([1, 0, 0]),
        rgba=False,
        addlight=True
    ):
        '''Render a mesh using OpenDR.

        verts: shape (V, 3)
        faces: shape (F, 3)
        img: shape (H, W, 3), range [0, 255] (np.uint8)
        R: rotation matrix applied to verts, shape (3, 3)
        Returns:
            rendered img: shape (H, W, 3), range [0, 255] (np.uint8)
        '''
        ## Create OpenDR renderer
        rn = self.renderer
        h, w = self.resolution
        K = self.K

        f = np.array([K[0, 0], K[1, 1]])
        c = np.array([K[0, 2], K[1, 2]])

        if faces is None:
            faces = self.faces
        if len(cam) == 4:
            t = np.array([cam[2], cam[3], 2 * K[0, 0] / (w * cam[0] + 1e-9)])
        elif len(cam) == 3:
            t = np.array([cam[1], cam[2], 2 * K[0, 0] / (w * cam[0] + 1e-9)])

        rn.camera = ProjectPoints(rt=np.array([0, 0, 0]), t=t, f=f, c=c, k=np.zeros(5))
        rn.frustum = {'near': 1., 'far': 1000., 'width': w, 'height': h}

        albedo = np.ones_like(verts) * .9
        if color is not None:
            color0 = np.array(color)
            color1 = np.array(color)
            color2 = np.array(color)
        elif color_type == 'white':
            color0 = np.array([1., 1., 1.])
            color1 = np.array([1., 1., 1.])
            color2 = np.array([0.7, 0.7, 0.7])
            color = np.ones_like(verts) * self.colors_dict[color_type][None, :]
        else:
            color0 = self.colors_dict[color_type] * 1.2
            color1 = self.colors_dict[color_type] * 1.2
            color2 = self.colors_dict[color_type] * 1.2
            color = np.ones_like(verts) * self.colors_dict[color_type][None, :]

        if R is not None:
            assert R.shape == (3, 3), "Shape of rotation matrix should be (3, 3)"
            verts = np.dot(verts, R)

        rn.set(v=verts, f=faces, vc=color, bgcolor=np.zeros(3))

        if addlight:
            yrot = np.radians(120)  # angle of lights
            # Construct front light
            rn.vc = LambertianPointLight(
                f=rn.f,
                v=rn.v,
                num_verts=len(rn.v),
                light_pos=rotateY(np.array([-200, -100, -100]), yrot),
                vc=albedo,
                light_color=color0
            )
            # Construct left light
            rn.vc += LambertianPointLight(
                f=rn.f,
                v=rn.v,
                num_verts=len(rn.v),
                light_pos=rotateY(np.array([800, 10, 300]), yrot),
                vc=albedo,
                light_color=color1
            )
            # Construct right light
            rn.vc += LambertianPointLight(
                f=rn.f,
                v=rn.v,
                num_verts=len(rn.v),
                light_pos=rotateY(np.array([-500, 500, 1000]), yrot),
                vc=albedo,
                light_color=color2
            )

        rendered_image = rn.r
        visibility_image = rn.visibility_image
        image_list = [img] if not isinstance(img, list) else img
        return_img = []
        for item in image_list:
            if self.ratio != 1:
                img_resized = resize(
                    item, (item.shape[0] * self.ratio, item.shape[1] * self.ratio),
                    anti_aliasing=True
                )
            else:
                img_resized = item / 255.
            try:
                img_resized[visibility_image != (2**32 - 1)
                            ] = rendered_image[visibility_image != (2**32 - 1)]
            except Exception:
                logger.warning('Cannot render mesh.')
            img_resized = (img_resized * 255).astype(np.uint8)
            res = img_resized

            if rgba:
                img_resized_rgba = np.zeros((img_resized.shape[0], img_resized.shape[1], 4))
                img_resized_rgba[:, :, :3] = img_resized
                img_resized_rgba[:, :, 3][visibility_image != (2**32 - 1)] = 255
                res = img_resized_rgba.astype(np.uint8)
            return_img.append(res)

        if not isinstance(img, list):
            return_img = return_img[0]

        return return_img
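
# Illustrative sketch (assumes `verts` is a (6890, 3) SMPL vertex array and
# `image` an HxWx3 uint8 frame; parameter values are arbitrary examples):
#
#     odr = OpenDRenderer(resolution=(224, 224))
#     overlay = odr(verts, img=image, cam=np.array([0.9, 0., 0.]), color_type='sky')
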
# https://github.com/classner/up/blob/master/up_tools/camera.py
def rotateY(points, angle):
    """Rotate all points in an (N, 3) array around the y axis."""
    ry = np.array(
        [[np.cos(angle), 0., np.sin(angle)],
         [0., 1., 0.],
         [-np.sin(angle), 0., np.cos(angle)]]
    )
    return np.dot(points, ry)


def rotateX(points, angle):
    """Rotate all points in an (N, 3) array around the x axis."""
    rx = np.array(
        [[1., 0., 0.],
         [0., np.cos(angle), -np.sin(angle)],
         [0., np.sin(angle), np.cos(angle)]]
    )
    return np.dot(points, rx)


def rotateZ(points, angle):
    """Rotate all points in an (N, 3) array around the z axis."""
    rz = np.array(
        [[np.cos(angle), -np.sin(angle), 0.],
         [np.sin(angle), np.cos(angle), 0.],
         [0., 0., 1.]]
    )
    return np.dot(points, rz)
class IUV_Renderer(object):
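    """Render per-vertex texture codes with PyTorch3D.

    mode='iuv'  : DensePose part index + UV coordinates as vertex colors.
    mode='pncc' : normalized T-pose coordinates as vertex colors.
    mode='seg'  : SMPL part-segmentation labels as vertex colors.
    """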
    def __init__(
        self,
        focal_length=5000.,
        orig_size=224,
        output_size=56,
        mode='iuv',
        device=torch.device('cuda'),
        mesh_type='smpl'
    ):
        self.focal_length = focal_length
        self.orig_size = orig_size
        self.output_size = output_size

        if mode in ['iuv']:
            if mesh_type == 'smpl':
                DP = DensePoseMethods()

                vert_mapping = DP.All_vertices.astype('int64') - 1
                self.vert_mapping = torch.from_numpy(vert_mapping)

                faces = DP.FacesDensePose
                faces = faces[None, :, :]
                self.faces = torch.from_numpy(
                    faces.astype(np.int32)
                )  # [1, 13774, 3], torch.int32

                num_part = float(np.max(DP.FaceIndices))
                self.num_part = num_part

                dp_vert_pid_fname = 'data/dp_vert_pid.npy'
                if os.path.exists(dp_vert_pid_fname):
                    dp_vert_pid = list(np.load(dp_vert_pid_fname))
                else:
                    logger.info('creating data/dp_vert_pid.npy')
                    dp_vert_pid = []
                    for v in range(len(vert_mapping)):
                        for i, f in enumerate(DP.FacesDensePose):
                            if v in f:
                                dp_vert_pid.append(DP.FaceIndices[i])
                                break
                    np.save(dp_vert_pid_fname, np.array(dp_vert_pid))

                textures_vts = np.array(
                    [
                        (dp_vert_pid[i] / num_part, DP.U_norm[i], DP.V_norm[i])
                        for i in range(len(vert_mapping))
                    ]
                )
                self.textures_vts = torch.from_numpy(
                    textures_vts[None].astype(np.float32)
                )  # (1, 7829, 3)
        elif mode == 'pncc':
            self.vert_mapping = None
            self.faces = torch.from_numpy(
                get_model_faces(mesh_type)[None].astype(np.int32)
            )  # mano: torch.Size([1, 1538, 3])

            textures_vts = get_model_tpose(mesh_type).unsqueeze(0)  # mano: torch.Size([1, 778, 3])
            texture_min = torch.min(textures_vts) - 0.001
            texture_range = torch.max(textures_vts) - texture_min + 0.001
            self.textures_vts = (textures_vts - texture_min) / texture_range
        elif mode in ['seg']:
            self.vert_mapping = None
            body_model = 'smpl'
            self.faces = torch.from_numpy(get_smpl_faces().astype(np.int32)[None])

            with open(
                os.path.join(
                    path_config.SMPL_MODEL_DIR, '{}_vert_segmentation.json'.format(body_model)
                ), 'rb'
            ) as json_file:
                smpl_part_id = json.load(json_file)

            v_id = []
            for k in smpl_part_id.keys():
                v_id.extend(smpl_part_id[k])
            v_id = torch.tensor(v_id)
            n_verts = len(torch.unique(v_id))

            num_part = len(constants.SMPL_PART_ID.keys())
            self.num_part = num_part

            seg_vert_pid = np.zeros(n_verts)
            for k in smpl_part_id.keys():
                seg_vert_pid[smpl_part_id[k]] = constants.SMPL_PART_ID[k]

            textures_vts = seg_vert_pid[:, None].repeat(3, axis=1) / num_part
            self.textures_vts = torch.from_numpy(textures_vts[None].astype(np.float32))

        K = np.array(
            [
                [self.focal_length, 0., self.orig_size / 2.],
                [0., self.focal_length, self.orig_size / 2.],
                [0., 0., 1.]
            ]
        )

        R = np.array([[-1., 0., 0.], [0., -1., 0.], [0., 0., 1.]])
        t = np.array([0, 0, 5])

        if self.orig_size != 224:
            render_scale = self.orig_size / float(224)
            K[0, 0] *= render_scale
            K[1, 1] *= render_scale
            K[0, 2] *= render_scale
            K[1, 2] *= render_scale

        self.K = torch.FloatTensor(K[None, :, :])
        self.R = torch.FloatTensor(R[None, :, :])
        self.t = torch.FloatTensor(t[None, None, :])

        # Pad K from 3x3 to the 4x4 convention expected by PerspectiveCameras.
        camK = F.pad(self.K, (0, 1, 0, 1), "constant", 0)
        camK[:, 2, 2] = 0
        camK[:, 3, 2] = 1
        camK[:, 2, 3] = 1
        self.K = camK

        self.device = device
        lights = AmbientLights(device=self.device)
        raster_settings = RasterizationSettings(
            image_size=output_size,
            blur_radius=0,
            faces_per_pixel=1,
        )
        self.renderer = MeshRenderer(
            rasterizer=MeshRasterizer(raster_settings=raster_settings),
            shader=HardFlatShader(
                device=self.device,
                lights=lights,
                blend_params=BlendParams(background_color=[0, 0, 0], sigma=0.0, gamma=0.0)
            )
        )
    def camera_matrix(self, cam):
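        """Build batched K, R, t from a weak-perspective cam = [s, tx, ty]."""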
        batch_size = cam.size(0)

        K = self.K.repeat(batch_size, 1, 1)
        R = self.R.repeat(batch_size, 1, 1)
        t = torch.stack(
            [-cam[:, 1], -cam[:, 2], 2 * self.focal_length / (self.orig_size * cam[:, 0] + 1e-9)],
            dim=-1
        )

        if cam.is_cuda:
            K = K.to(cam.device)
            R = R.to(cam.device)
            t = t.to(cam.device)

        return K, R, t
    def verts2iuvimg(self, verts, cam, iwp_mode=True):
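        """Render the texture-coded mesh for a batch of vertices.

        verts: (B, V, 3); cam: (B, 3) weak-perspective camera.
        Returns a (B, 3, output_size, output_size) image tensor.
        (`iwp_mode` is currently unused.)
        """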
        batch_size = verts.size(0)

        K, R, t = self.camera_matrix(cam)

        if self.vert_mapping is None:
            vertices = verts
        else:
            vertices = verts[:, self.vert_mapping, :]

        mesh = Meshes(vertices, self.faces.to(verts.device).expand(batch_size, -1, -1))
        mesh.textures = TexturesVertex(
            verts_features=self.textures_vts.to(verts.device).expand(batch_size, -1, -1)
        )

        cameras = PerspectiveCameras(
            device=verts.device,
            R=R,
            T=t,
            K=K,
            in_ndc=False,
            image_size=[(self.orig_size, self.orig_size)]
        )

        iuv_image = self.renderer(mesh, cameras=cameras)
        iuv_image = iuv_image[..., :3].permute(0, 3, 1, 2)

        return iuv_image
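
# Illustrative sketch (assumes a (B, 6890, 3) SMPL vertex tensor `verts` and a
# (B, 3) weak-perspective camera tensor `cam`, both on the same CUDA device):
#
#     iuv_renderer = IUV_Renderer(orig_size=224, output_size=56, mode='iuv')
#     iuv = iuv_renderer.verts2iuvimg(verts, cam)  # (B, 3, 56, 56)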