Spaces:

geopavlakos
/

HaMeR

Build error

App Files Files Community

HaMeR / hamer /utils /renderer.py

geopavlakos

Initial commit

d7a991a 12 months ago

raw

history blame contribute delete

15.6 kB

	import os
	#if 'PYOPENGL_PLATFORM' not in os.environ:
	# os.environ['PYOPENGL_PLATFORM'] = 'egl'
	import torch
	import numpy as np
	import pyrender
	import trimesh
	import cv2
	from yacs.config import CfgNode
	from typing import List, Optional

	def cam_crop_to_full(cam_bbox, box_center, box_size, img_size, focal_length=5000.):
	    """
	    Convert a crop-relative camera (scale, tx, ty) into a full-image camera translation.
	    Args:
	        cam_bbox: Indexed as [:, 0] (scale), [:, 1] (x offset) and [:, 2] (y offset).
	        box_center: Indexed as [:, 0] (x) and [:, 1] (y) of the crop center.
	        box_size: Crop size; multiplied elementwise with the scale column.
	        img_size: Indexed as [:, 0] (width) and [:, 1] (height) of the full image.
	        focal_length: Focal length used to derive the depth component.
	    Returns:
	        Tensor with (tx, ty, tz) stacked along the last dimension.
	    """
	    scale = cam_bbox[:, 0]
	    crop_tx = cam_bbox[:, 1]
	    crop_ty = cam_bbox[:, 2]

	    half_w = img_size[:, 0] / 2.
	    half_h = img_size[:, 1] / 2.

	    # Small epsilon keeps the divisions below finite when the scale is zero.
	    scaled_box = box_size * scale + 1e-9

	    depth = 2 * focal_length / scaled_box
	    shift_x = (2 * (box_center[:, 0] - half_w) / scaled_box) + crop_tx
	    shift_y = (2 * (box_center[:, 1] - half_h) / scaled_box) + crop_ty

	    return torch.stack([shift_x, shift_y, depth], dim=-1)

	def get_light_poses(n_lights=5, elevation=np.pi / 3, dist=12):
	    """
	    Build poses for lights arranged in a circle around the origin at a fixed elevation.
	    Args:
	        n_lights: Number of poses to generate; azimuths are evenly spaced over 2*pi.
	        elevation: Angle passed (negated) as the x rotation of every pose.
	        dist: Offset along z that is applied before the rotation.
	    Returns:
	        List of n_lights numpy arrays, each the product rotation @ translation.
	    """
	    # The same z offset is shared by every light; only the rotation varies.
	    offset = make_translation(torch.tensor([0, 0, dist]))

	    azimuths = 2 * np.pi * np.arange(n_lights) / n_lights
	    elevations = elevation * np.ones(n_lights)

	    return [
	        (make_rotation(rx=-theta, ry=phi, order="xyz") @ offset).numpy()
	        for phi, theta in zip(azimuths, elevations)
	    ]

	def make_translation(t):
	    """Return a homogeneous pose with identity rotation and translation t."""
	    identity_rotation = torch.eye(3)
	    return make_4x4_pose(identity_rotation, t)

	def make_rotation(rx=0, ry=0, rz=0, order="xyz"):
	    """
	    Compose per-axis rotations into a single homogeneous rotation pose.
	    Args:
	        rx, ry, rz: Rotation angles (radians) about the x, y and z axes.
	        order: Permutation of "xyz". The axis named first ends up as the
	            right-most factor of the matrix product, e.g. "xyz" gives Rz @ Ry @ Rx.
	    Returns:
	        Pose built by make_4x4_pose from the composed rotation and a zero translation.
	    Raises:
	        ValueError: If order is not a permutation of "xyz".
	    """
	    # Previously an unknown order fell through every branch and crashed with an
	    # UnboundLocalError on R; fail early with an explicit message instead.
	    if not isinstance(order, str) or sorted(order) != ["x", "y", "z"]:
	        raise ValueError(
	            f"order must be a permutation of 'xyz', got {order!r}"
	        )

	    per_axis = {"x": rotx(rx), "y": roty(ry), "z": rotz(rz)}
	    first, second, third = order
	    R = per_axis[third] @ per_axis[second] @ per_axis[first]
	    return make_4x4_pose(R, torch.zeros(3))

	def make_4x4_pose(R, t):
	    """
	    Assemble homogeneous poses from rotations and translations.
	    :param R (*, 3, 3)
	    :param t (*, 3)
	    return (*, 4, 4)
	    """
	    dims = R.shape[:-2]
	    # Append the translation as a fourth column: (*, 3, 4).
	    pose_3x4 = torch.cat([R, t.view(*dims, 3, 1)], dim=-1)
	    # Homogeneous row [0, 0, 0, 1], given one singleton axis per batch
	    # dimension and then broadcast to (*, 1, 4).
	    bottom = (
	        torch.tensor([0, 0, 0, 1], device=R.device)
	        .reshape(*((1,) * len(dims)), 1, 4)
	        .expand(*dims, 1, 4)
	    )
	    return torch.cat([pose_3x4, bottom], dim=-2)


	def rotx(theta):
	    """Return the 3x3 float32 rotation matrix for an angle theta (radians) about the x axis."""
	    cos_t = np.cos(theta)
	    sin_t = np.sin(theta)
	    rows = [
	        [1, 0, 0],
	        [0, cos_t, -sin_t],
	        [0, sin_t, cos_t],
	    ]
	    return torch.tensor(rows, dtype=torch.float32)


	def roty(theta):
	    """Return the 3x3 float32 rotation matrix for an angle theta (radians) about the y axis."""
	    cos_t = np.cos(theta)
	    sin_t = np.sin(theta)
	    rows = [
	        [cos_t, 0, sin_t],
	        [0, 1, 0],
	        [-sin_t, 0, cos_t],
	    ]
	    return torch.tensor(rows, dtype=torch.float32)


	def rotz(theta):
	    """Return the 3x3 float32 rotation matrix for an angle theta (radians) about the z axis."""
	    cos_t = np.cos(theta)
	    sin_t = np.sin(theta)
	    rows = [
	        [cos_t, -sin_t, 0],
	        [sin_t, cos_t, 0],
	        [0, 0, 1],
	    ]
	    return torch.tensor(rows, dtype=torch.float32)


	def create_raymond_lights() -> List[pyrender.Node]:
	    """
	    Build the three directional "raymond" light nodes for a scene.
	    Returns:
	        List of pyrender nodes, each holding a white DirectionalLight of
	        intensity 1.0 and a 4x4 matrix whose rotation columns are an
	        orthonormal (x, y, z) frame.
	    """
	    polar_angles = np.pi * np.array([1.0 / 6.0, 1.0 / 6.0, 1.0 / 6.0])
	    azimuth_angles = np.pi * np.array([0.0, 2.0 / 3.0, 4.0 / 3.0])

	    light_nodes = []
	    for azimuth, polar in zip(azimuth_angles, polar_angles):
	        # Frame z axis: unit vector given by the spherical angles.
	        z_axis = np.array([
	            np.sin(polar) * np.cos(azimuth),
	            np.sin(polar) * np.sin(azimuth),
	            np.cos(polar),
	        ])
	        z_axis = z_axis / np.linalg.norm(z_axis)

	        # Frame x axis: perpendicular to z within the xy-plane, with a fixed
	        # fallback when z has no xy component.
	        x_axis = np.array([-z_axis[1], z_axis[0], 0.0])
	        if np.linalg.norm(x_axis) == 0:
	            x_axis = np.array([1.0, 0.0, 0.0])
	        x_axis = x_axis / np.linalg.norm(x_axis)

	        y_axis = np.cross(z_axis, x_axis)

	        pose = np.eye(4)
	        pose[:3, :3] = np.column_stack((x_axis, y_axis, z_axis))

	        light = pyrender.DirectionalLight(color=np.ones(3), intensity=1.0)
	        light_nodes.append(pyrender.Node(light=light, matrix=pose))

	    return light_nodes

	class Renderer:
	    """Wrapper around the pyrender offscreen renderer for rendering MANO hand meshes."""

	    def __init__(self, cfg: CfgNode, faces: np.array):
	        """
	        Wrapper around the pyrender renderer to render MANO meshes.
	        Args:
	            cfg (CfgNode): Model config file. Reads EXTRA.FOCAL_LENGTH and MODEL.IMAGE_SIZE
	                here; MODEL.IMAGE_STD / MODEL.IMAGE_MEAN are read in __call__.
	            faces (np.array): Array of shape (F, 3) containing the mesh faces.
	        """
	        self.cfg = cfg
	        self.focal_length = cfg.EXTRA.FOCAL_LENGTH
	        self.img_res = cfg.MODEL.IMAGE_SIZE

	        # add faces that make the hand mesh watertight
	        faces_new = np.array([[92, 38, 234],
	                              [234, 38, 239],
	                              [38, 122, 239],
	                              [239, 122, 279],
	                              [122, 118, 279],
	                              [279, 118, 215],
	                              [118, 117, 215],
	                              [215, 117, 214],
	                              [117, 119, 214],
	                              [214, 119, 121],
	                              [119, 120, 121],
	                              [121, 120, 78],
	                              [120, 108, 78],
	                              [78, 108, 79]])
	        faces = np.concatenate([faces, faces_new], axis=0)

	        self.camera_center = [self.img_res // 2, self.img_res // 2]
	        self.faces = faces
	        # Same triangles with reversed vertex order; selected when is_right is falsy.
	        self.faces_left = self.faces[:, [0, 2, 1]]

	    @staticmethod
	    def _render_scene_rgba(scene, width, height):
	        """Render scene to an (height, width, 4) float32 RGBA image in [0, 1]; always releases the renderer."""
	        renderer = pyrender.OffscreenRenderer(viewport_width=width,
	                                              viewport_height=height,
	                                              point_size=1.0)
	        try:
	            color, _ = renderer.render(scene, flags=pyrender.RenderFlags.RGBA)
	        finally:
	            # Release the offscreen renderer even when rendering fails.
	            renderer.delete()
	        return color.astype(np.float32) / 255.0

	    def _add_camera_and_lights(self, scene, focal_length, render_res, camera_pose):
	        """Add an intrinsics camera node at camera_pose plus camera-relative and raymond lights."""
	        camera = pyrender.IntrinsicsCamera(fx=focal_length, fy=focal_length,
	                                           cx=render_res[0] / 2., cy=render_res[1] / 2.,
	                                           zfar=1e12)
	        camera_node = pyrender.Node(camera=camera, matrix=camera_pose)
	        scene.add_node(camera_node)
	        self.add_point_lighting(scene, camera_node)
	        self.add_lighting(scene, camera_node)
	        for node in create_raymond_lights():
	            scene.add_node(node)

	    @staticmethod
	    def _add_camera_relative_lights(scene, cam_node, light_poses, name_prefix, make_light):
	        """Add one light node per pose (plus one at the camera itself), expressed relative to the camera pose."""
	        poses = list(light_poses)
	        poses.append(np.eye(4))
	        cam_pose = scene.get_pose(cam_node)
	        for i, pose in enumerate(poses):
	            node = pyrender.Node(
	                name=f"{name_prefix}-{i:02d}",
	                light=make_light(),
	                matrix=cam_pose @ pose,
	            )
	            # NOTE(review): node was just created, so this guard presumably never
	            # triggers; kept to preserve the original behavior.
	            if scene.has_node(node):
	                continue
	            scene.add_node(node)

	    def __call__(self,
	                 vertices: np.array,
	                 camera_translation: np.array,
	                 image: torch.Tensor,
	                 full_frame: bool = False,
	                 imgname: Optional[str] = None,
	                 side_view=False, rot_angle=90,
	                 mesh_base_color=(1.0, 1.0, 0.9),
	                 scene_bg_color=(0, 0, 0),
	                 return_rgba=False,
	                 ) -> np.array:
	        """
	        Render meshes on input image
	        Args:
	            vertices (np.array): Array of shape (V, 3) containing the mesh vertices.
	            camera_translation (np.array): Array of shape (3,) with the camera translation.
	                The array is not modified.
	            image (torch.Tensor): Tensor of shape (3, H, W) containing the image crop with normalized pixel values.
	            full_frame (bool): If True, then render on the full image.
	            imgname (Optional[str]): Contains the original image filename. Used only if full_frame == True.
	            side_view (bool): If True, rotate the mesh by rot_angle degrees about the y axis
	                and return the rendering without compositing it over the image.
	            rot_angle (float): Side-view rotation angle in degrees.
	            mesh_base_color: RGB base color of the mesh material.
	            scene_bg_color: RGB background color of the scene (alpha is set to 0).
	            return_rgba (bool): If True, return the raw RGBA rendering.
	        Returns:
	            np.array: float32 image; (H, W, 4) when return_rgba is True, otherwise (H, W, 3).
	        Raises:
	            FileNotFoundError: If full_frame is True and imgname cannot be read.
	        """
	        if full_frame:
	            frame = cv2.imread(imgname)
	            if frame is None:
	                # cv2.imread signals failure by returning None rather than raising.
	                raise FileNotFoundError(f"Could not read image: {imgname}")
	            # BGR -> RGB, scaled to [0, 1].
	            image = frame.astype(np.float32)[:, :, ::-1] / 255.
	        else:
	            # Undo the per-channel normalization and convert to (H, W, 3) numpy.
	            image = image.clone() * torch.tensor(self.cfg.MODEL.IMAGE_STD, device=image.device).reshape(3, 1, 1)
	            image = image + torch.tensor(self.cfg.MODEL.IMAGE_MEAN, device=image.device).reshape(3, 1, 1)
	            image = image.permute(1, 2, 0).cpu().numpy()

	        material = pyrender.MetallicRoughnessMaterial(
	            metallicFactor=0.0,
	            alphaMode='OPAQUE',
	            baseColorFactor=(*mesh_base_color, 1.0))

	        # Flip x on a private copy so the caller's array is left untouched
	        # (an in-place flip would be undone by a second call with the same array).
	        camera_translation = np.array(camera_translation, dtype=np.float64)
	        camera_translation[0] *= -1.

	        mesh = trimesh.Trimesh(vertices.copy(), self.faces.copy())
	        if side_view:
	            rot = trimesh.transformations.rotation_matrix(
	                np.radians(rot_angle), [0, 1, 0])
	            mesh.apply_transform(rot)
	        # 180 degree rotation about x is always applied before rendering.
	        rot = trimesh.transformations.rotation_matrix(
	            np.radians(180), [1, 0, 0])
	        mesh.apply_transform(rot)
	        mesh = pyrender.Mesh.from_trimesh(mesh, material=material)

	        scene = pyrender.Scene(bg_color=[*scene_bg_color, 0.0],
	                               ambient_light=(0.3, 0.3, 0.3))
	        scene.add(mesh, 'mesh')

	        camera_pose = np.eye(4)
	        camera_pose[:3, 3] = camera_translation
	        camera_center = [image.shape[1] / 2., image.shape[0] / 2.]
	        camera = pyrender.IntrinsicsCamera(fx=self.focal_length, fy=self.focal_length,
	                                           cx=camera_center[0], cy=camera_center[1], zfar=1e12)
	        scene.add(camera, pose=camera_pose)

	        for node in create_raymond_lights():
	            scene.add_node(node)

	        color = self._render_scene_rgba(scene, image.shape[1], image.shape[0])

	        if return_rgba:
	            return color

	        # Alpha channel of the rendering acts as the blending mask.
	        valid_mask = (color[:, :, -1])[:, :, np.newaxis]
	        if not side_view:
	            output_img = (color[:, :, :3] * valid_mask + (1 - valid_mask) * image)
	        else:
	            output_img = color[:, :, :3]

	        return output_img.astype(np.float32)

	    def vertices_to_trimesh(self, vertices, camera_translation, mesh_base_color=(1.0, 1.0, 0.9),
	                            rot_axis=[1, 0, 0], rot_angle=0, is_right=1):
	        """
	        Build a vertex-colored trimesh from translated vertices.
	        Args:
	            vertices: Array whose first dimension is the number of vertices.
	            camera_translation: Offset added to every vertex.
	            mesh_base_color: RGB color; alpha 1.0 is appended and used for all vertices.
	            rot_axis: Axis of the first rotation.
	            rot_angle: Angle (degrees) of the first rotation.
	            is_right: Truthy selects self.faces, falsy selects self.faces_left.
	        Returns:
	            trimesh.Trimesh rotated by rot_angle about rot_axis and then by 180 degrees about x.
	        """
	        vertex_colors = np.array([(*mesh_base_color, 1.0)] * vertices.shape[0])
	        faces = self.faces if is_right else self.faces_left
	        mesh = trimesh.Trimesh(vertices.copy() + camera_translation, faces.copy(),
	                               vertex_colors=vertex_colors)

	        rot = trimesh.transformations.rotation_matrix(
	            np.radians(rot_angle), rot_axis)
	        mesh.apply_transform(rot)

	        rot = trimesh.transformations.rotation_matrix(
	            np.radians(180), [1, 0, 0])
	        mesh.apply_transform(rot)
	        return mesh

	    def render_rgba(
	            self,
	            vertices: np.array,
	            cam_t=None,
	            rot=None,
	            rot_axis=[1, 0, 0],
	            rot_angle=0,
	            camera_z=3,
	            mesh_base_color=(1.0, 1.0, 0.9),
	            scene_bg_color=(0, 0, 0),
	            render_res=[256, 256],
	            focal_length=None,
	            is_right=None,
	    ):
	        """
	        Render a single mesh to an RGBA image.
	        Args:
	            vertices (np.array): Mesh vertices.
	            cam_t: Optional camera translation; a copy with flipped x is used. When None,
	                the camera is placed at z = camera_z * focal_length / render_res[1].
	            rot: Unused.
	            rot_axis, rot_angle: Rotation (axis, degrees) applied to the mesh.
	            camera_z: Depth factor used only when cam_t is None.
	            mesh_base_color: RGB vertex color of the mesh.
	            scene_bg_color: RGB background color of the scene (alpha is set to 0).
	            render_res: (width, height) of the output.
	            focal_length: Focal length; defaults to self.focal_length.
	            is_right: Handedness flag; None is treated as a right hand, matching
	                render_rgba_multiple and the default of vertices_to_trimesh.
	        Returns:
	            float32 RGBA image with values in [0, 1].
	        """
	        focal_length = focal_length if focal_length is not None else self.focal_length

	        # None previously fell through as falsy and selected the left-hand faces.
	        if is_right is None:
	            is_right = 1

	        if cam_t is not None:
	            camera_translation = cam_t.copy()
	            camera_translation[0] *= -1.
	        else:
	            camera_translation = np.array([0, 0, camera_z * focal_length / render_res[1]])

	        mesh = self.vertices_to_trimesh(vertices, np.array([0, 0, 0]), mesh_base_color,
	                                        rot_axis, rot_angle, is_right=is_right)
	        mesh = pyrender.Mesh.from_trimesh(mesh)

	        scene = pyrender.Scene(bg_color=[*scene_bg_color, 0.0],
	                               ambient_light=(0.3, 0.3, 0.3))
	        scene.add(mesh, 'mesh')

	        camera_pose = np.eye(4)
	        camera_pose[:3, 3] = camera_translation
	        self._add_camera_and_lights(scene, focal_length, render_res, camera_pose)

	        return self._render_scene_rgba(scene, render_res[0], render_res[1])

	    def render_rgba_multiple(
	            self,
	            vertices: List[np.array],
	            cam_t: List[np.array],
	            rot_axis=[1, 0, 0],
	            rot_angle=0,
	            mesh_base_color=(1.0, 1.0, 0.9),
	            scene_bg_color=(0, 0, 0),
	            render_res=[256, 256],
	            focal_length=None,
	            is_right=None,
	    ):
	        """
	        Render several meshes into one RGBA image with the camera at the origin.
	        Args:
	            vertices (List[np.array]): Vertices of each mesh.
	            cam_t (List[np.array]): Per-mesh translation added to the vertices.
	            rot_axis, rot_angle: Rotation (axis, degrees) applied to every mesh.
	            mesh_base_color: RGB vertex color of the meshes.
	            scene_bg_color: RGB background color of the scene (alpha is set to 0).
	            render_res: (width, height) of the output.
	            focal_length: Focal length; defaults to self.focal_length.
	            is_right: Per-mesh handedness flags; None means all right hands.
	        Returns:
	            float32 RGBA image with values in [0, 1].
	        """
	        if is_right is None:
	            is_right = [1 for _ in range(len(vertices))]

	        focal_length = focal_length if focal_length is not None else self.focal_length

	        scene = pyrender.Scene(bg_color=[*scene_bg_color, 0.0],
	                               ambient_light=(0.3, 0.3, 0.3))
	        for i, (verts, trans, right) in enumerate(zip(vertices, cam_t, is_right)):
	            tmesh = self.vertices_to_trimesh(verts, trans.copy(), mesh_base_color,
	                                             rot_axis, rot_angle, is_right=right)
	            scene.add(pyrender.Mesh.from_trimesh(tmesh), f'mesh_{i}')

	        # Translations are baked into the vertices, so the camera stays at identity.
	        self._add_camera_and_lights(scene, focal_length, render_res, np.eye(4))

	        return self._render_scene_rgba(scene, render_res[0], render_res[1])

	    def add_lighting(self, scene, cam_node, color=np.ones(3), intensity=1.0):
	        """Add directional lights at the default get_light_poses() poses (plus the camera pose), relative to cam_node."""
	        self._add_camera_relative_lights(
	            scene, cam_node, get_light_poses(), "light",
	            lambda: pyrender.DirectionalLight(color=color, intensity=intensity),
	        )

	    def add_point_lighting(self, scene, cam_node, color=np.ones(3), intensity=1.0):
	        """Add point lights at get_light_poses(dist=0.5) poses (plus the camera pose), relative to cam_node."""
	        self._add_camera_relative_lights(
	            scene, cam_node, get_light_poses(dist=0.5), "plight",
	            lambda: pyrender.PointLight(color=color, intensity=intensity),
	        )