EvalMDE / evalmde /visualization /render_contour_line.py

zeyuren2002

Add files using upload-large-folder tool

d547008 verified 1 day ago

11.6 kB

	import argparse
	import math
	from pathlib import Path
	import json

	from PIL import Image
	import cv2
	import torch
	from torchvision import transforms as torch_trans
	import numpy as np

	from evalmde.utils.proj import depth_to_xyz
	from evalmde.utils.common import assign_item_to_dict, pathlib_file
	from evalmde.utils.image import resize
	from evalmde.utils.image import imread_rgb
	from evalmde.utils.depth import load_data
	from evalmde.utils.np_and_th import get_shifted_data


	@torch.no_grad()
	def compute_grid_lb_ub(data, i, j):
	    '''
	    Bounds of the data over one quarter-cell ("quadrant") of every pixel.

	    Each pixel ("." below) is surrounded by four quadrants indexed by (i, j):

	        .             .             .

	               -------------
	               |(0,0)|(0,1)|
	        .      ------.------      .
	               |(1,0)|(1,1)|
	               -------------

	        .             .             .

	    The four corners of a quadrant are the pixel itself, the midpoints towards
	    its two neighbours on that side, and the mean of the 2x2 pixel group that
	    contains them. The returned bounds are the min / max over those four values.

	    :param data: shape (H, W)
	    :param i: row index of the quadrant (0: towards the previous row, 1: towards the next row)
	    :param j: column index of the quadrant (0: towards the previous column, 1: towards the next column)
	    :return: lb, ub
	        lb, ub: shape (H - 1, W - 1). Entry [r, c] describes quadrant (i, j) of
	        pixel data[r + 1 - i, c + 1 - j]. Any (i, j) other than (0, 0), (0, 1)
	        and (1, 0) is handled as (1, 1).
	    '''
	    # The four pixels of every 2x2 neighbourhood, as aligned (H - 1, W - 1) views.
	    tl, tr = data[:-1, :-1], data[:-1, 1:]
	    bl, br = data[1:, :-1], data[1:, 1:]
	    center = .25 * (tl + tr + bl + br)

	    if i == 0 and j == 0:
	        # quadrant owned by the bottom-right pixel of the 2x2 group
	        corners = [center, .5 * (tr + br), .5 * (bl + br), 1. * br]
	    elif i == 0 and j == 1:
	        # quadrant owned by the bottom-left pixel
	        corners = [.5 * (tl + bl), center, 1. * bl, .5 * (bl + br)]
	    elif i == 1 and j == 0:
	        # quadrant owned by the top-right pixel
	        corners = [.5 * (tl + tr), 1. * tr, center, .5 * (tr + br)]
	    else:
	        # quadrant owned by the top-left pixel
	        corners = [1. * tl, .5 * (tl + tr), .5 * (tl + bl), center]

	    x = torch.stack(corners, dim=-1)
	    lb, ub = x.min(dim=-1).values, x.max(dim=-1).values  # (H - 1, W - 1), (H - 1, W - 1)
	    return lb, ub


	@torch.no_grad()
	def compute_high_res_idx(high_res_shape, data_low_res, valid, valid_high_res, gap, val_lb):
	    '''
	    Label every high-resolution pixel with the index of the contour level that
	    passes through it, or -1 when no level does.

	    Level k corresponds to the data value ``val_lb + k * gap`` (k >= 0).

	    :param high_res_shape: (Hu, Wu)
	    :param data_low_res: shape (Hl, Wl)
	    :param valid: shape (Hl, Wl), boolean mask of usable entries of data_low_res
	    :param valid_high_res: shape (Hu, Wu), boolean mask; pixels outside it are set to -1
	    :param gap: spacing between consecutive contour levels
	    :param val_lb: data value of contour level 0
	    :return: res_high_res
	        res_high_res: shape (Hu, Wu), int32
	    '''
	    Hu, Wu = high_res_shape

	    # fill invalid pixels with neighbor means
	    # (get_shifted_data is a project helper; presumably it returns the array
	    # shifted by (di, dj) -- confirm against evalmde.utils.np_and_th)
	    data_low_res = data_low_res.clone()
	    nb_data_sum = torch.zeros_like(data_low_res)
	    nb_data_cnt = torch.zeros_like(data_low_res)
	    for di in [-1, 0, 1]:
	        for dj in [-1, 0, 1]:
	            nb_valid = get_shifted_data(valid, di, dj)
	            nb_data = get_shifted_data(data_low_res, di, dj)
	            nb_data_sum[nb_valid] += nb_data[nb_valid]
	            nb_data_cnt[nb_valid] += 1
	    # pixels without any valid neighbour fall back to 0
	    nb_data_sum[nb_data_cnt < .5] = 0
	    data_low_res[~valid] = (nb_data_sum / nb_data_cnt.clamp(min=1))[~valid]

	    data_high_res = torch_trans.functional.resize(data_low_res[None], (Hu, Wu), torch_trans.InterpolationMode.BILINEAR)[0]
	    res_high_res = -torch.ones((Hu, Wu), dtype=torch.int32, device=data_high_res.device)

	    # Visit the four quadrants of every pixel; a level crosses the pixel when it
	    # lies within the [lb, ub] range of one of its quadrants.
	    for i in range(2):
	        for j in range(2):
	            lb, ub = compute_grid_lb_ub(data_high_res, i, j)
	            # smallest / largest level index inside [lb, ub]; lb_i > ub_i means no level
	            lb_i = torch.clip(torch.ceil((lb - val_lb) / gap), min=0).to(res_high_res.dtype)
	            ub_i = torch.clip(torch.floor((ub - val_lb) / gap), max=2e9).to(res_high_res.dtype)

	            # Views (not copies) of the pixels owning quadrant (i, j): writes go
	            # through to res_high_res and reads always see the latest labels.
	            res_view = res_high_res[1 - i: Hu - i, 1 - j: Wu - j]
	            data_view = data_high_res[1 - i: Hu - i, 1 - j: Wu - j]

	            # "multi": several candidate levels, or one candidate competing with an existing label
	            multi_line_mask = (lb_i < ub_i) | ((lb_i == ub_i) & (res_view != -1))
	            # "single": exactly one candidate and the pixel is still unlabeled
	            single_line_mask = (lb_i == ub_i) & (res_view == -1)

	            res_view[single_line_mask] = lb_i[single_line_mask]

	            # candidate for the multi case: level nearest to the pixel value, kept inside [lb_i, ub_i]
	            multi_line_upd_idx = torch.clip(torch.round((data_view - val_lb) / gap), min=0, max=2e9).to(res_high_res.dtype)
	            multi_line_upd_idx = torch.where(multi_line_upd_idx < lb_i, lb_i, multi_line_upd_idx)
	            multi_line_upd_idx = torch.where(multi_line_upd_idx > ub_i, ub_i, multi_line_upd_idx)
	            # accept the candidate when the pixel is unlabeled or the candidate is
	            # strictly closer to the pixel value than the current label
	            multi_line_upd_mask = ((res_view == -1) | (
	                torch.abs(data_view - (res_view * gap + val_lb)) >
	                torch.abs(data_view - (multi_line_upd_idx * gap + val_lb))
	            )) & multi_line_mask
	            res_view[multi_line_upd_mask] = multi_line_upd_idx[multi_line_upd_mask]
	    res_high_res[~valid_high_res] = -1
	    return res_high_res


	def get_contour_line_gap(data: torch.Tensor, valid: torch.Tensor, num_gap, qt):
	    '''
	    Spacing between contour levels such that roughly ``num_gap`` intervals span
	    the data range, estimated robustly from the qt / (1 - qt) quantiles.

	    :param data: values to contour
	    :param valid: boolean mask selecting the entries of data to use
	    :param num_gap: desired number of intervals across the data range
	    :param qt: lower quantile; the upper one is 1 - qt
	    :return: gap. Falls back to 1 when there is no valid entry or when no
	        positive, finite gap can be derived (num_gap == 0, qt == 0.5,
	        constant or non-finite data).
	    '''
	    if not valid.any():
	        return 1
	    valid_data = data[valid]
	    qt_lb = valid_data.quantile(qt).item()
	    qt_ub = valid_data.quantile(1 - qt).item()
	    # The quantiles cover a (1 - 2 * qt) fraction of the range; rescale to the full range.
	    denom = num_gap * (1 - qt * 2)
	    if denom == 0:
	        # would otherwise raise ZeroDivisionError
	        return 1
	    gap = (qt_ub - qt_lb) / denom
	    if not math.isfinite(gap) or gap <= 0:
	        # a zero / negative / NaN gap breaks the level-index computation downstream
	        return 1
	    return gap


	@torch.no_grad()
	def gen_contour_line(rgb_high_res, data, valid, valid_high_res, is_z, num_gap, shift, thickness=0, qt=0.05, colormap=cv2.COLORMAP_JET):
	    '''
	    Draw colour-coded contour lines of ``data`` on top of ``rgb_high_res``.

	    :param rgb_high_res: high-resolution background image (numpy array)
	    :param data: low-resolution values to contour (numpy array)
	    :param valid: low-resolution boolean mask for data (numpy array)
	    :param valid_high_res: high-resolution boolean mask (numpy array)
	    :param is_z: if true, contours are computed on 1 / data
	    :param num_gap: desired number of contour intervals
	    :param shift: offset of the first level above the data minimum, in units of the gap
	    :param thickness: radius (in high-resolution pixels) by which lines are thickened
	    :param qt: quantile passed to get_contour_line_gap
	    :param colormap: OpenCV colormap id used to colour the levels
	    :return: img, colored_mask, col
	        img: same shape as rgb_high_res; zeros outside valid_high_res
	        colored_mask: boolean mask of the pixels that carry a contour colour
	        col: uint8 colour table, one row per level
	    '''
	    device = 'cuda' if torch.cuda.is_available() else 'cpu'
	    data, valid, valid_high_res = (
	        torch.from_numpy(arr).to(device) for arr in (data, valid, valid_high_res)
	    )
	    if is_z:
	        data = 1 / data

	    gap = get_contour_line_gap(data, valid, num_gap, qt)
	    data_lb = data[valid].min().item() if valid.any() else 0
	    val_lb = data_lb + gap * shift

	    thin_idx = compute_high_res_idx(rgb_high_res.shape[:2], data, valid, valid_high_res, gap, val_lb)

	    # Thicken the lines: an unlabeled valid pixel takes the label of the first
	    # labeled neighbour found within a disc of radius `thickness`.
	    res = thin_idx.clone()
	    radius = int(math.floor(thickness))
	    reach = range(-radius, radius + 1)
	    disc_offsets = [(di, dj) for di in reach for dj in reach
	                    if di * di + dj * dj <= thickness * thickness]
	    for di, dj in disc_offsets:
	        nb_res = get_shifted_data(thin_idx, di, dj)
	        nb_valid = get_shifted_data(valid_high_res, di, dj)
	        upd_mask = nb_valid & (res == -1) & (nb_res != -1) & valid_high_res
	        res[upd_mask] = nb_res[upd_mask]

	    # Re-base the labels so that the smallest one present becomes 0.
	    labeled = res != -1
	    if labeled.any():
	        res[labeled] -= res[labeled].min()
	    res = res.cpu().numpy()
	    valid_high_res = valid_high_res.cpu().numpy()
	    num_val = max(2, res.max().item() + 1)

	    # Colour table: sample the 256-entry colormap at num_val evenly spaced
	    # positions, linearly interpolating between adjacent entries.
	    lut = cv2.applyColorMap(np.arange(256, dtype=np.uint8)[None], colormap)[0].astype(np.float32)  # (256, 3)
	    pos = np.arange(num_val, dtype=np.float32) / (num_val - 1) * 255  # (num_val,)
	    lo = np.floor(pos).astype(np.int32)  # (num_val,)
	    hi = np.minimum(lo + 1, 255)
	    w_lo = (lo.astype(np.float32) + 1 - pos)[:, None]  # (num_val, 1)
	    col = np.round(lut[lo] * w_lo + lut[hi] * (1 - w_lo)).astype(np.uint8)  # (num_val, 3)

	    # Compose: background where valid but unlabeled, level colour where labeled.
	    colored_mask = valid_high_res & (res != -1)
	    plain_mask = valid_high_res & (res == -1)
	    img = np.zeros_like(rgb_high_res)
	    img[plain_mask] = rgb_high_res[plain_mask]
	    img[colored_mask] = col[res[colored_mask]]
	    return img, colored_mask, col


	def pil_ds(img: np.ndarray, H, W):
	    '''
	    Resize an image to H x W with PIL's Lanczos filter.

	    :param img: array interpreted by PIL in 'RGB' mode
	    :param H: target height
	    :param W: target width
	    :return: resized image as a numpy array
	    '''
	    resized = Image.fromarray(img, mode='RGB').resize((W, H), Image.Resampling.LANCZOS)
	    return np.array(resized)


	def render_contour_line_imgs(xyz: np.ndarray, valid: np.ndarray, rgb_low_res: np.ndarray, save_shape, out_root):
	    '''
	    Render contour-line overlays for the x, y and z channels of ``xyz`` plus a
	    combined x/y overlay, for a sweep of contour densities, and write them as
	    PNG files under ``out_root`` together with a ``summary.json`` index.

	    :param xyz: per-pixel values; channel i of the last axis is contoured as 'x', 'y', 'z'
	    :param valid: boolean mask matching the first two axes of xyz
	    :param rgb_low_res: background image at the resolution of xyz
	    :param save_shape: (H, W) of the saved images
	    :param out_root: output directory
	    :return:
	    '''
	    # hyperparams
	    texture_strength = 0.8
	    draw_dim_lb = 4 * np.linalg.norm([1920, 1080])

	    out_root = pathlib_file(out_root)

	    # Integer upsampling factor so that the drawing canvas diagonal reaches draw_dim_lb.
	    low_h, low_w = rgb_low_res.shape[0], rgb_low_res.shape[1]
	    dim = np.linalg.norm(rgb_low_res.shape[:2])
	    us_sc = int(math.ceil(draw_dim_lb / dim))
	    high_h, high_w = us_sc * low_h, us_sc * low_w
	    dimmed = texture_strength * cv2.resize(rgb_low_res, (high_w, high_h))
	    rgb_high_res = np.round(dimmed).astype(np.uint8)
	    valid_high_res = torch_trans.functional.resize(
	        torch.from_numpy(valid)[None], rgb_high_res.shape[:2], torch_trans.InterpolationMode.NEAREST_EXACT
	    )[0].numpy()

	    summary = {}

	    def _save(canvas, key, thickness, num_gap, shift):
	        # Crop a us_sc-pixel border, reverse the channel order, downsample and
	        # write the image; then record its path (relative to out_root) in the summary.
	        out_f = out_root / key / f'thickness__{thickness:.1f}___num_gap__{num_gap}___shift__{shift:.2f}.png'
	        out_f.parent.mkdir(parents=True, exist_ok=True)
	        cropped = canvas[us_sc:-us_sc, us_sc:-us_sc, ::-1].copy()
	        cv2.imwrite(out_f.as_posix(), pil_ds(cropped, save_shape[0], save_shape[1]))
	        print(f'Saved to {out_f.resolve()}')
	        assign_item_to_dict(summary, [key, thickness, num_gap, shift], str(out_f.resolve().relative_to(out_root.resolve())))

	    thickness_opts = [5 * np.linalg.norm(rgb_high_res.shape[:2]) / (4 * np.linalg.norm([1920, 1080]))]
	    rel_num_gap_opts = [0.015, 0.03, 0.06, 0.09, 0.12, 0.24, 0.42, 0.6]
	    shift_opts = [0.5]

	    for thickness in thickness_opts:
	        for rel_num_gap in rel_num_gap_opts:
	            num_gap = int(dim * rel_num_gap)
	            for shift in shift_opts:
	                imgs, colored_masks, col_maps = {}, {}, {}
	                for i, name in enumerate(['x', 'y', 'z']):
	                    rendered = gen_contour_line(rgb_high_res, xyz[..., i], valid, valid_high_res, name == 'z',
	                                                num_gap, shift, thickness)
	                    imgs[name], colored_masks[name], col_maps[name] = rendered
	                    _save(imgs[name], name, thickness, num_gap, shift)

	                # Combined x/y overlay: average the two colours where both lines
	                # are present, otherwise take whichever line is present.
	                on_x, on_y = colored_masks['x'], colored_masks['y']
	                both = np.logical_and(on_x, on_y)
	                only_x = np.logical_and(on_x, np.logical_not(on_y))
	                only_y = np.logical_and(np.logical_not(on_x), on_y)
	                blended = np.round(.5 * (imgs['x'].astype(np.float32) + imgs['y'].astype(np.float32))).astype(np.uint8)

	                img_xy = rgb_high_res.copy()
	                img_xy[both] = blended[both]
	                img_xy[only_x] = imgs['x'][only_x]
	                img_xy[only_y] = imgs['y'][only_y]
	                img_xy[~valid_high_res] = 0
	                # img_xy = caption_img_xy(img_xy, col_maps)
	                _save(img_xy, 'xy', thickness, num_gap, shift)

	    with (out_root / 'summary.json').open('w') as F:
	        json.dump(summary, F)


	def get_out_dir(work_dir, depth_f):
	    '''
	    Output directory for the contour-line renders of one depth file.

	    The depth file's path relative to ``work_dir`` is flattened into a single
	    directory name: the file extension is dropped and the path components are
	    joined with '_'.

	    :param work_dir: pathlib.Path of the working directory
	    :param depth_f: path of the depth file, relative to work_dir
	    :return: work_dir / 'contour_line' / <flattened name>
	    :raises ValueError: if depth_f resolves to a location outside work_dir
	    '''
	    rel = (work_dir / depth_f).resolve().relative_to(work_dir.resolve())
	    # with_suffix('') removes the extension whatever its length, and joining the
	    # parts avoids depending on the platform's path separator.
	    return work_dir / 'contour_line' / '_'.join(rel.with_suffix('').parts)


	def main(args):
	    '''
	    Load an RGB image and a depth file and render their contour-line images.

	    :param args: namespace with attributes
	        root: base directory (pathlib.Path)
	        rgb_f: RGB image path, relative to root
	        depth_f: depth file path, relative to root
	        save_dim_ub: target upper bound on the diagonal (in pixels) of the saved images
	    '''
	    save_dim_ub = args.save_dim_ub

	    root = args.root
	    rgb_f = root / args.rgb_f
	    data_f = root / args.depth_f

	    raw_rgb = imread_rgb(rgb_f)

	    # Largest integer upscale whose diagonal stays within save_dim_ub. Clamp to 1:
	    # for an input that is already larger than save_dim_ub the floor is 0, which
	    # would request a (0, 0) output image.
	    save_sc = max(1, int(math.floor(save_dim_ub / np.linalg.norm(raw_rgb.shape[:2]))))
	    save_shape = (save_sc * raw_rgb.shape[0], save_sc * raw_rgb.shape[1])

	    depth, intr, valid = load_data(data_f)
	    xyz = depth_to_xyz(intr, depth)

	    render_contour_line_imgs(xyz, valid, raw_rgb, save_shape, get_out_dir(root, args.depth_f))


	if __name__ == "__main__":
	    parser = argparse.ArgumentParser()
	    parser.add_argument("root", type=Path)
	    # Required: main() joins this onto root unconditionally, so a missing value
	    # would otherwise surface as a TypeError instead of a usage message.
	    parser.add_argument("--depth_f", type=str, required=True, help='Path to depth file, relative to root.')
	    # A bare `--rgb_f` (no value) falls back to the default file name; a None
	    # here could not be joined onto root.
	    parser.add_argument('--rgb_f', type=str, nargs='?', const='rgb.png', default='rgb.png', help='Path to rgb file, relative to root.')
	    parser.add_argument("--save_dim_ub", type=float, default=np.linalg.norm([1920, 1080]))
	    args = parser.parse_args()

	    main(args)