Spaces:

mmlab-ntu
/

Segment-Any-RGBD

Runtime error

Segment-Any-RGBD / datasets /scannet_preprocess /scannet_pair /point_cloud_extractor.py

Jingkang Yang

first commit

bd27f44 about 2 years ago

3.56 kB

	# Copyright (c) Facebook, Inc. and its affiliates.
	#
	# This source code is licensed under the MIT license found in the
	# LICENSE file in the root directory of this source tree.


	import glob, os
	import numpy as np
	import cv2
	import torch


	def extractor(input_path, output_path):
	    """Back-project every RGB-D frame under ``input_path`` into a coloured point cloud.

	    Reads ``intrinsic/intrinsic_depth.txt``, ``pose/*.txt``, ``depth/*.png`` and
	    ``color/*.png`` below ``input_path`` (frame files are named by an integer
	    index) and writes one ``<index>.pth`` per frame into ``output_path`` with
	    ``torch.save``. Each file holds ``dict(coord=..., color=...)``: ``coord`` is
	    an (N, 3) array of points after the frame pose has been applied, ``color``
	    the matching (N, 3) colours in RGB order. Pixels with zero depth are dropped.

	    Frames whose ``.pth`` file already exists are skipped, so an interrupted
	    run can be resumed. A frame that cannot be loaded or converted is reported
	    and skipped; the remaining frames are still processed.

	    Args:
	        input_path: Directory of one exported scan.
	        output_path: Directory for the ``.pth`` files; created (including
	            missing parents) when it does not exist.

	    Raises:
	        OSError: If the depth intrinsic file cannot be read.
	    """
	    os.makedirs(output_path, exist_ok=True)

	    # Load depth camera intrinsic.
	    depth_intrinsic = np.loadtxt(os.path.join(input_path, 'intrinsic', 'intrinsic_depth.txt'))
	    print('Depth intrinsic: ')
	    print(depth_intrinsic)

	    # Collect the per-frame files in numeric frame order (plain string order
	    # would put frame 10 before frame 2).
	    poses = sorted(glob.glob(os.path.join(input_path, 'pose', '*.txt')), key=_frame_index)
	    depths = sorted(glob.glob(os.path.join(input_path, 'depth', '*.png')), key=_frame_index)
	    color_paths = sorted(glob.glob(os.path.join(input_path, 'color', '*.png')), key=_frame_index)
	    if not (len(poses) == len(depths) == len(color_paths)):
	        # zip() below pairs files by sorted position and stops at the shortest list.
	        print('Warning: frame counts differ (pose={}, depth={}, color={}); '
	              'frames are paired by sorted position.'.format(
	                  len(poses), len(depths), len(color_paths)))

	    # Raw depth values are divided by this factor (presumably millimetres -> metres).
	    depth_shift = 1000.0

	    # Get aligned point clouds.
	    for pose_path, depth_path, color_path in zip(poses, depths, color_paths):
	        name = os.path.basename(pose_path).split('.')[0]
	        out_file = os.path.join(output_path, '{}.pth'.format(name))

	        # Resume support: test for the file this function actually writes.
	        if os.path.exists(out_file):
	            continue

	        try:
	            print('=' * 50, ': {}'.format(pose_path))
	            depth_img = cv2.imread(depth_path, -1)  # -1: keep stored bit depth (16-bit depth maps)
	            color_image = cv2.imread(color_path)
	            if depth_img is None or color_image is None:
	                # cv2.imread reports failure by returning None instead of raising.
	                print('Skipping frame {}: could not read depth/color image'.format(name))
	                continue

	            pose = np.loadtxt(pose_path)
	            print('Camera pose: ')
	            print(pose)

	            points_world, valid = _backproject_depth(depth_img, depth_intrinsic, pose, depth_shift)
	            print(points_world.shape)

	            # Resize the colour image to the depth resolution so the validity
	            # mask lines up pixel for pixel (640x480 for 640x480 depth maps).
	            height, width = depth_img.shape[:2]
	            color_image = cv2.resize(color_image, (width, height))
	            # OpenCV loads images as BGR; reverse the channel axis to store RGB.
	            rgb = np.ascontiguousarray(color_image[valid][:, ::-1])

	            pcd = dict(coord=points_world[:, :3], color=rgb)
	            torch.save(pcd, out_file)
	        except Exception as err:
	            # Best effort: report the broken frame and keep going. Unlike a bare
	            # ``except``, this lets KeyboardInterrupt / SystemExit stop the run.
	            print('Skipping frame {}: {}: {}'.format(name, type(err).__name__, err))
	            continue


	def _frame_index(path):
	    """Return the integer frame index encoded in a file name such as ``12.txt``."""
	    return int(os.path.basename(path).split('.')[0])


	def _backproject_depth(depth_img, depth_intrinsic, pose, depth_shift):
	    """Lift the non-zero depth pixels to homogeneous points and apply ``pose``.

	    Returns ``(points, valid)``: ``points`` is an (N, 4) array of transformed
	    homogeneous points and ``valid`` is the boolean mask of non-zero depth
	    pixels. Rows of ``points`` follow the row-major order of ``valid``, which
	    is the same order boolean-mask indexing of an image produces.
	    """
	    fx = depth_intrinsic[0, 0]
	    fy = depth_intrinsic[1, 1]
	    cx = depth_intrinsic[0, 2]
	    cy = depth_intrinsic[1, 2]
	    # The fourth column carries an optional offset; treat it as zero when the
	    # intrinsic matrix has only three columns.
	    has_offset = depth_intrinsic.shape[1] > 3
	    bx = depth_intrinsic[0, 3] if has_offset else 0.0
	    by = depth_intrinsic[1, 3] if has_offset else 0.0

	    # A boolean mask keeps the result 2-D even when a single pixel is valid
	    # (np.where(...) followed by squeeze() collapses that case to 1-D).
	    valid = depth_img != 0
	    rows, cols = np.nonzero(valid)
	    z = depth_img[valid] / depth_shift

	    points = np.ones((z.shape[0], 4))
	    points[:, 0] = (cols - cx) * z / fx + bx
	    points[:, 1] = (rows - cy) * z / fy + by
	    points[:, 2] = z
	    # Row-vector convention: p_out = p @ pose^T  (equivalent to pose @ p per point).
	    return np.dot(points, np.transpose(pose)), valid