Huiwenshi's picture
Upload folder using huggingface_hub
0514ca2 verified
raw
history blame
5.99 kB
# Copyright (C) 2022-present Naver Corporation. All rights reserved.
# Licensed under CC BY-NC-SA 4.0 (non-commercial use only).
"""
Paths to Habitat-Sim scenes
"""
import os
import json
import collections
from tqdm import tqdm
# Hardcoded path to the different scene datasets
SCENES_DATASET = {
"hm3d": "./data/habitat-sim-data/scene_datasets/hm3d/",
"gibson": "./data/habitat-sim-data/scene_datasets/gibson/",
"habitat-test-scenes": "./data/habitat-sim/scene_datasets/habitat-test-scenes/",
"replica_cad_baked_lighting": "./data/habitat-sim/scene_datasets/replica_cad_baked_lighting/",
"replica_cad": "./data/habitat-sim/scene_datasets/replica_cad/",
"replica": "./data/habitat-sim/scene_datasets/ReplicaDataset/",
"scannet": "./data/habitat-sim/scene_datasets/scannet/"
}
SceneData = collections.namedtuple("SceneData", ["scene_dataset_config_file", "scene", "navmesh", "output_dir"])
def list_replicacad_scenes(base_output_dir, base_path=SCENES_DATASET["replica_cad"]):
scene_dataset_config_file = os.path.join(base_path, "replicaCAD.scene_dataset_config.json")
scenes = [f"apt_{i}" for i in range(6)] + ["empty_stage"]
navmeshes = [f"navmeshes/apt_{i}_static_furniture.navmesh" for i in range(6)] + ["empty_stage.navmesh"]
scenes_data = []
for idx in range(len(scenes)):
output_dir = os.path.join(base_output_dir, "ReplicaCAD", scenes[idx])
# Add scene
data = SceneData(scene_dataset_config_file=scene_dataset_config_file,
scene = scenes[idx] + ".scene_instance.json",
navmesh = os.path.join(base_path, navmeshes[idx]),
output_dir = output_dir)
scenes_data.append(data)
return scenes_data
def list_replica_cad_baked_lighting_scenes(base_output_dir, base_path=SCENES_DATASET["replica_cad_baked_lighting"]):
scene_dataset_config_file = os.path.join(base_path, "replicaCAD_baked.scene_dataset_config.json")
scenes = sum([[f"Baked_sc{i}_staging_{j:02}" for i in range(5)] for j in range(21)], [])
navmeshes = ""#[f"navmeshes/apt_{i}_static_furniture.navmesh" for i in range(6)] + ["empty_stage.navmesh"]
scenes_data = []
for idx in range(len(scenes)):
output_dir = os.path.join(base_output_dir, "replica_cad_baked_lighting", scenes[idx])
data = SceneData(scene_dataset_config_file=scene_dataset_config_file,
scene = scenes[idx],
navmesh = "",
output_dir = output_dir)
scenes_data.append(data)
return scenes_data
def list_replica_scenes(base_output_dir, base_path):
scenes_data = []
for scene_id in os.listdir(base_path):
scene = os.path.join(base_path, scene_id, "mesh.ply")
navmesh = os.path.join(base_path, scene_id, "habitat/mesh_preseg_semantic.navmesh") # Not sure if I should use it
scene_dataset_config_file = ""
output_dir = os.path.join(base_output_dir, scene_id)
# Add scene only if it does not exist already, or if exist_ok
data = SceneData(scene_dataset_config_file = scene_dataset_config_file,
scene = scene,
navmesh = navmesh,
output_dir = output_dir)
scenes_data.append(data)
return scenes_data
def list_scenes(base_output_dir, base_path):
"""
Generic method iterating through a base_path folder to find scenes.
"""
scenes_data = []
for root, dirs, files in os.walk(base_path, followlinks=True):
folder_scenes_data = []
for file in files:
name, ext = os.path.splitext(file)
if ext == ".glb":
scene = os.path.join(root, name + ".glb")
navmesh = os.path.join(root, name + ".navmesh")
if not os.path.exists(navmesh):
navmesh = ""
relpath = os.path.relpath(root, base_path)
output_dir = os.path.abspath(os.path.join(base_output_dir, relpath, name))
data = SceneData(scene_dataset_config_file="",
scene = scene,
navmesh = navmesh,
output_dir = output_dir)
folder_scenes_data.append(data)
# Specific check for HM3D:
# When two meshesxxxx.basis.glb and xxxx.glb are present, use the 'basis' version.
basis_scenes = [data.scene[:-len(".basis.glb")] for data in folder_scenes_data if data.scene.endswith(".basis.glb")]
if len(basis_scenes) != 0:
folder_scenes_data = [data for data in folder_scenes_data if not (data.scene[:-len(".glb")] in basis_scenes)]
scenes_data.extend(folder_scenes_data)
return scenes_data
def list_scenes_available(base_output_dir, scenes_dataset_paths=SCENES_DATASET):
scenes_data = []
# HM3D
for split in ("minival", "train", "val", "examples"):
scenes_data += list_scenes(base_output_dir=os.path.join(base_output_dir, f"hm3d/{split}/"),
base_path=f"{scenes_dataset_paths['hm3d']}/{split}")
# Gibson
scenes_data += list_scenes(base_output_dir=os.path.join(base_output_dir, "gibson"),
base_path=scenes_dataset_paths["gibson"])
# Habitat test scenes (just a few)
scenes_data += list_scenes(base_output_dir=os.path.join(base_output_dir, "habitat-test-scenes"),
base_path=scenes_dataset_paths["habitat-test-scenes"])
# ReplicaCAD (baked lightning)
scenes_data += list_replica_cad_baked_lighting_scenes(base_output_dir=base_output_dir)
# ScanNet
scenes_data += list_scenes(base_output_dir=os.path.join(base_output_dir, "scannet"),
base_path=scenes_dataset_paths["scannet"])
# Replica
list_replica_scenes(base_output_dir=os.path.join(base_output_dir, "replica"),
base_path=scenes_dataset_paths["replica"])
return scenes_data