Spaces:

Realcat
/

image-matching-webui

Running

image-matching-webui / third_party /mast3r /dust3r /datasets_preprocess /habitat /preprocess_habitat.py

Realcat

add: mast3r

f90241e 6 months ago

5.6 kB

	#!/usr/bin/env python3
	# Copyright (C) 2024-present Naver Corporation. All rights reserved.
	# Licensed under CC BY-NC-SA 4.0 (non-commercial use only).
	#
	# --------------------------------------------------------
	# main executable for preprocessing habitat
	# export METADATA_DIR="/path/to/habitat/5views_v1_512x512_metadata"
	# export SCENES_DIR="/path/to/habitat/data/scene_datasets/"
	# export OUTPUT_DIR="data/habitat_processed"
	# export PYTHONPATH=$(pwd)
	# python preprocess_habitat.py --scenes_dir=$SCENES_DIR --metadata_dir=$METADATA_DIR --output_dir=$OUTPUT_DIR | parallel -j 16
	# --------------------------------------------------------
	import os
	import glob
	import json
	import os

	import PIL.Image
	import json
	os.environ["OPENCV_IO_ENABLE_OPENEXR"] = "1" # noqa
	import cv2
	from habitat_renderer import multiview_crop_generator
	from tqdm import tqdm


	def preprocess_metadata(metadata_filename,
	                        scenes_dir,
	                        output_dir,
	                        crop_resolution=None,
	                        equirectangular_resolution=None,
	                        fix_existing_dataset=False):
	    """Render and save the crops described by one metadata JSON file.

	    For every view listed under ``metadata["view_batches"]`` this writes three
	    files into ``output_dir``: ``<batch>_<view>.jpeg`` (color image),
	    ``<batch>_<view>_depth.exr`` (depth map, half-float EXR) and
	    ``<batch>_<view>_camera_params.json`` (camera parameters).

	    Args:
	        metadata_filename: Path to the metadata JSON file. It must provide the
	            keys ``scene``, ``scene_dataset_config_file`` and ``view_batches``.
	        scenes_dir: Directory against which the scene path (or the scene
	            dataset config path, when one is given) is resolved.
	        output_dir: Directory receiving the generated files.
	        crop_resolution: Two-element crop size. Every view's ``"size"`` entry
	            must equal it. Defaults to ``[512, 512]``.
	        equirectangular_resolution: Resolution used to render the environment
	            map. Defaults to ``(4 * max(crop_resolution),
	            8 * max(crop_resolution))``.
	        fix_existing_dataset: When true, an already existing ``output_dir`` is
	            accepted and views whose camera-parameters file is already present
	            are skipped.

	    Raises:
	        FileExistsError: If ``output_dir`` exists and ``fix_existing_dataset``
	            is false.
	        AssertionError: If a view's ``"size"`` differs from ``crop_resolution``.
	    """
	    # Build a fresh list on every call (no shared mutable default) and keep it
	    # a list so that it compares equal to the JSON-decoded view sizes.
	    crop_resolution = [512, 512] if crop_resolution is None else list(crop_resolution)

	    # Load data
	    with open(metadata_filename, "r") as f:
	        metadata = json.load(f)

	    if metadata["scene_dataset_config_file"] == "":
	        # Stand-alone scene: the scene path is relative to scenes_dir.
	        scene = os.path.join(scenes_dir, metadata["scene"])
	        scene_dataset_config_file = ""
	    else:
	        # Scene referenced through a dataset config located under scenes_dir.
	        scene = metadata["scene"]
	        scene_dataset_config_file = os.path.join(scenes_dir, metadata["scene_dataset_config_file"])
	    navmesh = None

	    if equirectangular_resolution is None:
	        # Render the environment map at (4x, 8x) the largest crop dimension.
	        max_res = max(crop_resolution)
	        equirectangular_resolution = (4 * max_res, 8 * max_res)

	    print("equirectangular_resolution:", equirectangular_resolution)

	    if os.path.exists(output_dir) and not fix_existing_dataset:
	        raise FileExistsError(output_dir)

	    # Lazy initialization: the renderer is only created once a view actually
	    # needs to be generated.
	    highres_dataset = None

	    for batch_label, batch in tqdm(metadata["view_batches"].items()):
	        for view_label, view_params in batch.items():

	            assert view_params["size"] == crop_resolution, (
	                f"view size {view_params['size']} does not match crop_resolution {crop_resolution}")
	            label = f"{batch_label}_{view_label}"

	            output_camera_params_filename = os.path.join(output_dir, f"{label}_camera_params.json")
	            if fix_existing_dataset and os.path.isfile(output_camera_params_filename):
	                # Skip generation if we are fixing a dataset and the corresponding output file already exists
	                continue

	            # Lazy initialization
	            if highres_dataset is None:
	                highres_dataset = multiview_crop_generator.HabitatMultiviewCrops(
	                    scene=scene,
	                    navmesh=navmesh,
	                    scene_dataset_config_file=scene_dataset_config_file,
	                    equirectangular_resolution=equirectangular_resolution,
	                    crop_resolution=crop_resolution,
	                )
	                # Create the output directory once, together with the renderer.
	                # With exist_ok=False this must not run again for later views.
	                os.makedirs(output_dir, exist_ok=bool(fix_existing_dataset))

	            # Generate a higher resolution crop
	            original_projection, position = multiview_crop_generator.dict_to_perspective_projection(view_params)
	            # Render an envmap at the given position
	            viewpoint_data = highres_dataset.render_viewpoint_data(position)

	            projection = original_projection
	            colormap, depthmap, pointmap, _ = highres_dataset.extract_cropped_camera(
	                projection, viewpoint_data.colormap, viewpoint_data.distancemap, viewpoint_data.pointmap)

	            camera_params = multiview_crop_generator.perspective_projection_to_dict(projection, position)

	            # Color image
	            PIL.Image.fromarray(colormap).save(os.path.join(output_dir, f"{label}.jpeg"))
	            # Depth image
	            cv2.imwrite(os.path.join(output_dir, f"{label}_depth.exr"),
	                        depthmap, [cv2.IMWRITE_EXR_TYPE, cv2.IMWRITE_EXR_TYPE_HALF])
	            # Camera parameters
	            with open(output_camera_params_filename, "w") as f:
	                json.dump(camera_params, f)


	# Script entry point.
	# Without --metadata_filename: print one command line per metadata.json found
	# under --metadata_dir whose output directory does not exist yet (the output
	# is meant to be piped to a job runner such as `parallel`).
	# With --metadata_filename: process that single metadata file.
	if __name__ == "__main__":
	    import argparse
	    import shlex

	    parser = argparse.ArgumentParser()
	    parser.add_argument("--metadata_dir", required=True)
	    parser.add_argument("--scenes_dir", required=True)
	    parser.add_argument("--output_dir", required=True)
	    parser.add_argument("--metadata_filename", default="")

	    args = parser.parse_args()

	    if args.metadata_filename == "":
	        # Walk through the metadata dir to generate commandlines.
	        # glob.escape keeps glob metacharacters in the directory name literal.
	        pattern = os.path.join(glob.escape(args.metadata_dir), "**/metadata.json")
	        for filename in glob.iglob(pattern, recursive=True):
	            # Mirror the metadata directory layout below the output directory.
	            output_dir = os.path.join(args.output_dir, os.path.relpath(os.path.dirname(filename), args.metadata_dir))
	            if not os.path.exists(output_dir):
	                # Quote every path: the line is executed by a shell, so spaces
	                # or metacharacters would otherwise split or alter arguments.
	                commandline = (
	                    f"python {shlex.quote(__file__)}"
	                    f" --metadata_filename={shlex.quote(filename)}"
	                    f" --metadata_dir={shlex.quote(args.metadata_dir)}"
	                    f" --scenes_dir={shlex.quote(args.scenes_dir)}"
	                    f" --output_dir={shlex.quote(output_dir)}"
	                )
	                print(commandline)
	    else:
	        preprocess_metadata(metadata_filename=args.metadata_filename,
	                            scenes_dir=args.scenes_dir,
	                            output_dir=args.output_dir)