Spaces:

nev
/

dalle-6D

Runtime error

App Files Files Community

neverix committed on Jul 18, 2022

Commit

2ddc005

1 Parent(s): e2dc8d7

First prototype?

Browse files

Files changed (2) hide show

app.py +90 -1
packages.txt +1 -0

app.py CHANGED Viewed

@@ -1,7 +1,13 @@
 from PIL import Image
 import gradio as gr
 import numpy as np
 import torch
 class MidasDepth(object):
@@ -27,9 +33,91 @@ class MidasDepth(object):
         return prediction.detach().cpu().numpy()
 def main():
     midas = MidasDepth()
-    interface = gr.Interface(fn=lambda x, *t: [Image.fromarray(midas.get_depth(x).astype("uint8")), None], inputs=[
         gr.inputs.Image(label="src", type="numpy"),
         gr.inputs.Number(label="tx", default=0.0),
         gr.inputs.Number(label="ty", default=0.0),
@@ -38,6 +126,7 @@ def main():
         gr.inputs.Number(label="ry", default=0.0),
         gr.inputs.Number(label="rz", default=0.0)
     ], outputs=[
         gr.outputs.Image(type="numpy"),
         gr.outputs.Video()
     ], title="DALL·E 6D", description="Lift DALL·E 2 (or any other model) into 3D!")

+from tqdm.auto import trange
 from PIL import Image
 import gradio as gr
 import numpy as np
+import pyrender
+import trimesh
+import scipy
 import torch
+import cv2
+import os
 class MidasDepth(object):
         return prediction.detach().cpu().numpy()
def process_depth(dep):
    """Normalize a raw depth prediction and flag depth discontinuities.

    The input is shifted and scaled into [0, 1], clipped to [0.2, 1] and
    inverted, so the returned values lie in [1, 5].  Edges are detected on a
    median-blurred copy by comparing the local max and min in a 3x3 window.

    Args:
        dep: Depth prediction as an array (presumably the 2-D output of
            ``MidasDepth.get_depth`` -- verify against caller).  It is not
            modified.

    Returns:
        A ``(depth, pick_edges)`` tuple: the processed (un-blurred) float32
        depth map and a boolean mask that is True where the local depth range
        exceeds the threshold.
    """
    # medianBlur with ksize=5 only accepts 8-bit, 16-bit unsigned or float32
    # input, and the in-place division below needs a float dtype.
    depth = np.array(dep, dtype=np.float32, order="C")
    depth -= depth.min()
    peak = depth.max()
    # A perfectly flat depth map would give 0 / 0 = NaN everywhere.
    if peak > 0:
        depth /= peak
    depth = 1 / np.clip(depth, 0.2, 1)
    blurred = cv2.medianBlur(depth, 5)  # 9 not available because it requires 8-bit
    window = np.ones((3, 3))
    maxd = cv2.dilate(blurred, window)
    mind = cv2.erode(blurred, window)
    edges = maxd - mind
    threshold = .05  # Better to have false positives
    pick_edges = edges > threshold
    return depth, pick_edges
def make_mesh(pic, depth, pick_edges):
    """Build a coloured triangle mesh from an image and its depth map.

    Every pixel becomes one vertex.  Pixel coordinates are centred, scaled by
    ``2 / width`` and multiplied by the pixel's depth; y and z are then
    negated.  Each pixel that is not flagged in ``pick_edges`` contributes up
    to two triangles: one with its upper and left neighbours and one with its
    lower and right neighbours.

    Args:
        pic: Image convertible with ``np.asarray`` to an ``(H, W, C)`` array
            with at least three channels; only the first three are used as
            colour.
        depth: Depth values, one per pixel, in row-major order.
        pick_edges: ``(H, W)`` boolean mask; True pixels emit no triangles.

    Returns:
        A ``trimesh.Trimesh`` with one opaque RGBA colour per face, taken
        from the face's first vertex.
    """
    im = np.asarray(pic)
    height, width = im.shape[:2]
    ys, xs = np.mgrid[0:height, 0:width]
    index = ys * width + xs  # flat (row-major) vertex index of every pixel

    # Vertex positions: columns are (x, y, z).  The centre is (W, H) / 2 so
    # that it lines up with the (x, y) column order for non-square images.
    grid = np.stack((xs, ys), axis=-1).reshape(-1, 2)
    centre = np.array([width, height]) / 2
    plane = (grid - centre) / width * 2
    z = np.asarray(depth).reshape(-1, 1)
    positions = np.concatenate((plane, z), axis=-1)
    positions[:, :-1] *= positions[:, -1:]
    positions[:, 1] *= -1

    # Drop any alpha channel so the reshape cannot scramble the colours.
    colors = im[..., :3].reshape(-1, 3)

    # Candidate triangles per pixel, in the same order the nested loops used:
    # row by row, pixel by pixel, upper-left triangle before lower-right.
    keep = ~np.asarray(pick_edges, dtype=bool)
    upper_left = np.stack((index, index - width, index - 1), axis=-1)
    lower_right = np.stack((index, index + width, index + 1), axis=-1)
    candidates = np.stack((upper_left, lower_right), axis=2)
    valid = np.stack((keep & (xs > 0) & (ys > 0),
                      keep & (xs < width - 1) & (ys < height - 1)),
                     axis=-1)
    faces = candidates[valid]

    face_colors = colors[faces[:, 0]]
    opaque = np.full((len(faces), 1), 255, dtype=face_colors.dtype)
    tri_mesh = trimesh.Trimesh(vertices=positions * np.array([1.0, 1.0, -1.0]),
                               faces=faces,
                               face_colors=np.concatenate((face_colors, opaque),
                                                          axis=-1),
                               smooth=False,
                               )
    return tri_mesh
def args_to_mat(tx, ty, tz, rx, ry, rz):
    """Build a 4x4 homogeneous transform from a translation and Euler angles.

    Args:
        tx, ty, tz: Translation components, written to the last column.
        rx, ry, rz: Intrinsic "XYZ" Euler angles in radians (SciPy's default
            unit for ``from_euler``).

    Returns:
        A ``(4, 4)`` float array whose upper-left 3x3 block is the rotation
        and whose last column holds the translation.
    """
    # Rotation lives in scipy.spatial.transform; a bare ``import scipy`` does
    # not guarantee that submodule is loaded, so import it explicitly here.
    from scipy.spatial.transform import Rotation

    mat = np.eye(4)
    mat[:3, :3] = Rotation.from_euler("XYZ", (rx, ry, rz)).as_matrix()
    mat[:3, 3] = tx, ty, tz
    return mat
def render(mesh, mat):
    """Render a mesh off-screen from a given camera pose.

    Args:
        mesh: A ``pyrender.Mesh``, or a trimesh mesh that is converted with
            ``pyrender.Mesh.from_trimesh(..., smooth=False)``.
        mat: 4x4 camera pose passed to ``Scene.add``.

    Returns:
        A 1024x1024 RGBA ``PIL.Image``.  Pixels where the rendered depth is 0
        are black with alpha 0; all other pixels have alpha 255.
    """
    # Scene.add only accepts pyrender objects, so wrap raw trimesh meshes.
    if not isinstance(mesh, pyrender.Mesh):
        mesh = pyrender.Mesh.from_trimesh(mesh, smooth=False)
    scene = pyrender.Scene(ambient_light=np.array([1.0, 1.0, 1.0]))
    camera = pyrender.PerspectiveCamera(yfov=np.pi / 2, aspectRatio=1.0)
    scene.add(camera, pose=mat)
    scene.add(mesh)
    r = pyrender.OffscreenRenderer(1024, 1024)
    try:
        rgb, d = r.render(scene, pyrender.constants.RenderFlags.FLAT)
    finally:
        # Release the off-screen GL context even if rendering fails.
        r.delete()
    mask = d == 0
    rgb = rgb.copy()
    rgb[mask] = 0
    alpha = (~mask[..., np.newaxis]).astype(np.uint8) * 255
    res = Image.fromarray(np.concatenate((rgb, alpha), axis=-1))
    return res
 def main():
+    os.environ["PYOPENGL_PLATFORM"] = "osmesa"
     midas = MidasDepth()
+    def fn(pic, *args):
+        depth, pick_edges = process_depth(midas.get_depth(pic))
+        mesh = make_mesh(pic, depth, pick_edges)
+        frame = render(mesh, args_to_mat(*args))
+        return np.asarray(frame), (255 / np.asarray(depth)).astype(np.uint8), None
+    interface = gr.Interface(fn=fn, inputs=[
         gr.inputs.Image(label="src", type="numpy"),
         gr.inputs.Number(label="tx", default=0.0),
         gr.inputs.Number(label="ty", default=0.0),
         gr.inputs.Number(label="ry", default=0.0),
         gr.inputs.Number(label="rz", default=0.0)
     ], outputs=[
+        gr.outputs.Image(type="numpy"),
         gr.outputs.Image(type="numpy"),
         gr.outputs.Video()
     ], title="DALL·E 6D", description="Lift DALL·E 2 (or any other model) into 3D!")

packages.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ mesa-utils