<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<title>Gradio-Lite: Serverless Gradio Running Entirely in Your Browser</title>
<meta name="description" content="Gradio-Lite: Serverless Gradio Running Entirely in Your Browser">
<script type="module" crossorigin src="https://cdn.jsdelivr.net/npm/@gradio/lite/dist/lite.js"></script>
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/@gradio/lite/dist/lite.css" />
<style>
html, body {
    margin: 0;
    padding: 0;
    height: 100%;
}
</style>
</head>
<body>
<gradio-lite>
<gradio-file name="app.py" entrypoint>
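# Browser-only depth estimation demo: the Xenova/depth-anything-small-hf
# model runs client-side via Transformers.js, and the predicted depth map
# is turned into a colored GLB mesh with trimesh.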
import gradio as gr
import numpy as np
import PIL.Image
import trimesh
from transformers_js import import_transformers_js, as_url

transformers = await import_transformers_js()
pipeline = transformers.pipeline
# Loading the model downloads the weights, so the pipeline call is awaited.
depth_estimator = await pipeline('depth-estimation', 'Xenova/depth-anything-small-hf')
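
# The mesh construction treats the depth map as a height field: every pixel
# becomes one vertex (x, y, depth) carrying that pixel's RGB color, and each
# 2x2 block of neighboring pixels is split into two triangles.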
def depthmap_to_glb_trimesh(depth_map, rgb_image, file_path):
    assert depth_map.shape[:2] == rgb_image.shape[:2], "Depth map and RGB image must have the same dimensions"

    # Generate vertices and faces
    vertices = []
    colors = []
    faces = []
    height, width = depth_map.shape
    for y in range(height):
        for x in range(width):
            z = depth_map[y, x]
            vertices.append([x, y, z])
            colors.append(rgb_image[y, x])

    # Create faces (2 triangles per pixel, except for edges)
    for y in range(height - 1):
        for x in range(width - 1):
            top_left = y * width + x
            top_right = top_left + 1
            bottom_left = top_left + width
            bottom_right = bottom_left + 1
            faces.append([top_left, bottom_left, top_right])
            faces.append([top_right, bottom_left, bottom_right])

    # Convert to numpy arrays
    vertices = np.array(vertices, dtype=np.float64)
    colors = np.array(colors, dtype=np.uint8)
    faces = np.array(faces, dtype=np.int32)

    mesh = trimesh.Trimesh(vertices=vertices, faces=faces, vertex_colors=colors, process=False)

    # Export to GLB
    mesh.export(file_path, file_type='glb')
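
# The raw predictions are flipped before meshing: invert_depth reverses the
# depth values and invert_xy mirrors both axes, so that the reconstructed
# mesh renders with the expected orientation in the Model3D viewer.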
def invert_depth(depth_map):
    max_depth = np.max(depth_map)
    return max_depth - depth_map
def invert_xy(arr):
    return arr[::-1, ::-1]
async def estimate(image_path, depth_scale):
    image = PIL.Image.open(image_path)
    image.thumbnail((384, 384))  # Resize the image, keeping the aspect ratio

    predictions = await depth_estimator(as_url(image_path))
    depth_image = predictions["depth"].to_pil()

    # Expose only serializable metadata; the raw `tensor.data` buffer
    # cannot be JSON-serialized for the gr.JSON output.
    tensor = predictions["predicted_depth"]
    tensor_data = {
        "dims": tensor.dims,
        "type": tensor.type,
        "size": tensor.size,
    }

    # Construct the 3D model from the depth map and the RGB image
    depth = predictions["predicted_depth"].to_numpy()
    depth = invert_depth(depth)
    depth = invert_xy(depth)
    depth = depth * depth_scale
    # The model outputs the depth map in a different size than the input image,
    # so resize the depth map to match the original image size.
    depth = np.array(PIL.Image.fromarray(depth).resize(image.size))

    image_array = np.asarray(image)
    image_array = invert_xy(image_array)

    glb_file_path = "output.glb"
    depthmap_to_glb_trimesh(depth, image_array, glb_file_path)

    return depth_image, glb_file_path, tensor_data
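
# UI: an input image and a depth-scale slider map to three outputs: the depth
# image, the GLB file for the Model3D viewer, and the tensor metadata as JSON.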
demo = gr.Interface(
    fn=estimate,
    inputs=[
        gr.Image(type="filepath"),
        gr.Slider(minimum=1, maximum=100, value=10, label="Depth Scale"),
    ],
    outputs=[
        gr.Image(label="Depth Image"),
        gr.Model3D(label="3D Model"),
        gr.JSON(label="Tensor"),
    ],
    examples=[
        ["bread_small.png"],
        ["cats.jpg"],
    ],
)

demo.launch()
</gradio-file>
<gradio-file name="bread_small.png" url="https://huggingface.co/datasets/Xenova/transformers.js-docs/resolve/main/bread_small.png" />
<gradio-file name="cats.jpg" url="https://huggingface.co/datasets/Xenova/transformers.js-docs/resolve/main/cats.jpg" />
<gradio-requirements>
transformers_js_py
trimesh
</gradio-requirements>
</gradio-lite>
</body>
</html>