Spaces:

MyNiuuu
/

MOFA-Video_Traj

Runtime error

myniu

init

826d651 6 months ago

7.86 kB

	# MIT License
	#
	# Copyright (c) 2018 Tom Runia
	#
	# Permission is hereby granted, free of charge, to any person obtaining a copy
	# of this software and associated documentation files (the "Software"), to deal
	# in the Software without restriction, including without limitation the rights
	# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
	# copies of the Software, and to permit persons to whom the Software is
	# furnished to do so, subject to conditions.
	#
	# Author: Tom Runia
	# Date Created: 2018-08-03

	from __future__ import absolute_import
	from __future__ import division
	from __future__ import print_function

	import numpy as np
	from PIL import Image
	import torch


	def make_colorwheel():
	    '''
	    Builds the colour wheel used to colour-code optical flow, as presented in:
	    Baker et al. "A Database and Evaluation Methodology for Optical Flow" (ICCV, 2007)
	    URL: http://vision.middlebury.edu/flow/flowEval-iccv07.pdf
	    According to the C++ source code of Daniel Scharstein
	    According to the Matlab source code of Deqing Sun

	    The wheel is the concatenation of six hue transitions. Within each
	    transition one channel is held at 255 while a second channel ramps
	    linearly up from 0 or down from 255; the third channel stays at 0.

	    :return: np.ndarray of shape [55, 3] (float), rows are RGB values in [0, 255]
	    '''
	    # (segment length, channel held at 255, ramping channel, ramp rises?)
	    transitions = (
	        (15, 0, 1, True),    # RY: red -> yellow
	        (6, 1, 0, False),    # YG: yellow -> green
	        (4, 1, 2, True),     # GC: green -> cyan
	        (11, 2, 1, False),   # CB: cyan -> blue
	        (13, 2, 0, True),    # BM: blue -> magenta
	        (6, 0, 2, False),    # MR: magenta -> red
	    )

	    total_rows = sum(length for length, _, _, _ in transitions)
	    wheel = np.zeros((total_rows, 3))

	    start = 0
	    for length, full_channel, ramp_channel, rising in transitions:
	        stop = start + length
	        ramp = np.floor(255 * np.arange(0, length) / length)
	        wheel[start:stop, full_channel] = 255
	        wheel[start:stop, ramp_channel] = ramp if rising else 255 - ramp
	        start = stop

	    return wheel


	def flow_compute_color(u, v, convert_to_bgr=False):
	    '''
	    Applies the flow color wheel to (possibly clipped) flow components u and v.
	    According to the C++ source code of Daniel Scharstein
	    According to the Matlab source code of Deqing Sun

	    The flow direction selects a (linearly interpolated) hue on the colour
	    wheel and the flow magnitude controls saturation: magnitudes <= 1 fade
	    towards white as they approach 0, magnitudes > 1 are darkened by 0.75.

	    :param u: np.ndarray of shape [H,W], input horizontal flow
	    :param v: np.ndarray of shape [H,W], input vertical flow
	    :param convert_to_bgr: bool, whether to change ordering and output BGR instead of RGB
	    :return: np.ndarray of shape [H,W,3], dtype uint8
	    '''

	    flow_image = np.zeros((u.shape[0], u.shape[1], 3), np.uint8)

	    colorwheel = make_colorwheel()  # shape [55x3]
	    ncols = colorwheel.shape[0]

	    rad = np.sqrt(np.square(u) + np.square(v))
	    a = np.arctan2(-v, -u) / np.pi  # normalised angle in [-1, 1]

	    # Zero-based wheel position in [0, ncols - 1]. The Matlab reference adds
	    # 1 here because Matlab arrays are 1-based; keeping that offset while
	    # indexing a NumPy array shifts every hue by one entry and runs off the
	    # end of the wheel when a == 1.
	    fk = (a + 1) / 2 * (ncols - 1)
	    k0 = np.floor(fk).astype(np.int32)
	    k1 = k0 + 1
	    k1[k1 == ncols] = 0  # wrap the upper neighbour around the wheel
	    f = fk - k0  # interpolation weight between wheel entries k0 and k1

	    # The magnitude mask is identical for all three channels.
	    idx = (rad <= 1)

	    for i in range(colorwheel.shape[1]):
	        tmp = colorwheel[:, i]
	        col0 = tmp[k0] / 255.0
	        col1 = tmp[k1] / 255.0
	        col = (1 - f) * col0 + f * col1

	        col[idx] = 1 - rad[idx] * (1 - col[idx])
	        col[~idx] = col[~idx] * 0.75  # out of range?

	        # Note the 2-i => BGR instead of RGB
	        ch_idx = 2 - i if convert_to_bgr else i
	        flow_image[:, :, ch_idx] = np.floor(255 * col)

	    return flow_image


	def flow_to_color(flow_uv, clip_flow=None, convert_to_bgr=False):
	    '''
	    Expects a two dimensional flow image of shape [H,W,2]
	    According to the C++ source code of Daniel Scharstein
	    According to the Matlab source code of Deqing Sun

	    The flow is normalised by its largest magnitude before colouring, so the
	    colours are relative to the strongest motion in this particular image.

	    :param flow_uv: np.ndarray of shape [H,W,2]
	    :param clip_flow: float, maximum clipping value for flow; each component
	        is limited to [-clip_flow, clip_flow]. None disables clipping.
	    :param convert_to_bgr: bool, whether to output BGR instead of RGB
	    :return: np.ndarray of shape [H,W,3], dtype uint8
	    '''

	    assert flow_uv.ndim == 3, 'input flow must have three dimensions'
	    assert flow_uv.shape[2] == 2, 'input flow must have shape [H,W,2]'

	    if clip_flow is not None:
	        # Clip symmetrically: a lower bound of 0 would wipe out every
	        # negative component, i.e. all leftward and upward motion.
	        flow_uv = np.clip(flow_uv, -clip_flow, clip_flow)

	    u = flow_uv[:, :, 0]
	    v = flow_uv[:, :, 1]

	    rad = np.sqrt(np.square(u) + np.square(v))
	    rad_max = np.max(rad)

	    # epsilon keeps the division finite for an all-zero flow field.
	    epsilon = 1e-5
	    u = u / (rad_max + epsilon)
	    v = v / (rad_max + epsilon)

	    return flow_compute_color(u, v, convert_to_bgr)


	# Flow components whose absolute value exceeds this threshold are treated as
	# "unknown" by flow_to_image: they are zeroed and rendered as black pixels.
	UNKNOWN_FLOW_THRESH = 1e7
	# NOTE(review): SMALLFLOW and LARGEFLOW are not referenced by any function
	# visible in this file; presumably leftovers from the ported reference
	# code -- confirm before relying on or removing them.
	SMALLFLOW = 0.0
	LARGEFLOW = 1e8


	def make_color_wheel():
	    """
	    Generate color wheel according Middlebury color code

	    The wheel is assembled from six consecutive hue segments (RY, YG, GC,
	    CB, BM, MR). In every segment one channel is fixed at 255, one channel
	    ramps linearly, and the remaining channel is 0.

	    :return: Color wheel, float array of shape [55, 3] with RGB rows in [0, 255]
	    """

	    def rising(count):
	        # 0, floor(255/count), ... : ramps up but never reaches 255
	        return np.floor(255 * np.arange(0, count) / count)

	    def falling(count):
	        # mirror image of rising(): starts at 255 and ramps down
	        return 255 - rising(count)

	    def segment(count, red, green, blue):
	        # each channel argument is either a scalar or a length-`count` ramp
	        rows = np.zeros([count, 3])
	        rows[:, 0] = red
	        rows[:, 1] = green
	        rows[:, 2] = blue
	        return rows

	    return np.concatenate([
	        segment(15, 255, rising(15), 0),     # RY
	        segment(6, falling(6), 255, 0),      # YG
	        segment(4, 0, 255, rising(4)),       # GC
	        segment(11, 0, falling(11), 255),    # CB
	        segment(13, rising(13), 0, 255),     # BM
	        segment(6, 255, 0, falling(6)),      # MR
	    ])


	def compute_color(u, v):
	    """
	    compute optical flow color map

	    The flow direction picks a (linearly interpolated) hue on the Middlebury
	    colour wheel; magnitudes <= 1 fade towards white as they approach 0 and
	    magnitudes > 1 are darkened by 0.75. Pixels where either component is
	    NaN come out black. The input arrays are not modified.

	    :param u: optical flow horizontal map, 2-D array [H, W]
	    :param v: optical flow vertical map, 2-D array [H, W]
	    :return: optical flow in color code, float array [H, W, 3] holding
	        whole-number values in [0, 255]
	    """
	    [h, w] = u.shape
	    img = np.zeros([h, w, 3])

	    # Replace NaNs on copies so the caller's arrays are left untouched.
	    nan_mask = np.isnan(u) | np.isnan(v)
	    u = np.where(nan_mask, 0, u)
	    v = np.where(nan_mask, 0, v)

	    colorwheel = make_color_wheel()
	    ncols = np.size(colorwheel, 0)

	    rad = np.sqrt(u ** 2 + v ** 2)

	    a = np.arctan2(-v, -u) / np.pi  # normalised angle in [-1, 1]

	    # 1-based wheel position (Matlab convention); 1 is subtracted again
	    # when the wheel is indexed below.
	    fk = (a + 1) / 2 * (ncols - 1) + 1

	    k0 = np.floor(fk).astype(int)

	    k1 = k0 + 1
	    k1[k1 == ncols + 1] = 1  # wrap the upper neighbour around the wheel
	    f = fk - k0  # interpolation weight between entries k0 and k1

	    # The magnitude masks are the same for every channel.
	    idx = rad <= 1
	    notidx = np.logical_not(idx)

	    for i in range(0, np.size(colorwheel, 1)):
	        tmp = colorwheel[:, i]
	        col0 = tmp[k0 - 1] / 255
	        col1 = tmp[k1 - 1] / 255
	        col = (1 - f) * col0 + f * col1

	        col[idx] = 1 - rad[idx] * (1 - col[idx])
	        col[notidx] *= 0.75

	        # (1 - nan_mask) zeroes the pixels whose flow was NaN.
	        img[:, :, i] = np.uint8(np.floor(255 * col * (1 - nan_mask)))

	    return img


	# from https://github.com/gengshan-y/VCN
	def flow_to_image(flow):
	    """
	    Convert flow into middlebury color code image

	    Components whose absolute value exceeds UNKNOWN_FLOW_THRESH are treated
	    as unknown and rendered black. The remaining flow is normalised by its
	    largest magnitude before colouring. The input is not modified.

	    :param flow: optical flow map of shape [H, W, 2]; either a torch tensor
	        (any device) or a NumPy array
	    :return: optical flow image in middlebury color, np.ndarray uint8 [H, W, 3]
	    """
	    # Do all the work in NumPy so tensors and arrays take the same path.
	    if torch.is_tensor(flow):
	        flow = flow.detach().cpu().numpy()
	    flow = np.asarray(flow)

	    # Copy the components: they are masked in place below and must not
	    # write through to the caller's data.
	    u = flow[:, :, 0].copy()
	    v = flow[:, :, 1].copy()

	    idx_unknown = (np.abs(u) > UNKNOWN_FLOW_THRESH) | (np.abs(v) > UNKNOWN_FLOW_THRESH)
	    u[idx_unknown] = 0
	    v[idx_unknown] = 0

	    rad = np.sqrt(u ** 2 + v ** 2)
	    maxrad = max(-1, np.max(rad))

	    # eps keeps the division finite for an all-zero flow field.
	    eps = np.finfo(float).eps
	    u = u / (maxrad + eps)
	    v = v / (maxrad + eps)

	    img = compute_color(u, v)

	    # Black out unknown pixels in all three colour channels.
	    idx = np.repeat(idx_unknown[:, :, np.newaxis], 3, axis=2)
	    img[idx] = 0

	    return np.uint8(img)


	def save_vis_flow_tofile(flow, output_path):
	    """
	    Render a flow map as a Middlebury colour image and write it to disk.

	    :param flow: optical flow map, forwarded unchanged to flow_to_image
	    :param output_path: destination handed to PIL's Image.save
	    """
	    rendered = Image.fromarray(flow_to_image(flow))
	    rendered.save(output_path)


	def flow_tensor_to_image(flow):
	    """
	    Used for tensorboard visualization

	    :param flow: torch tensor of shape [2, H, W]
	    :return: np.ndarray uint8 of shape [3, H, W] (channels-first colour image)
	    """
	    # Pass a tensor: flow_to_image is written against torch tensors.
	    # detach() drops autograd tracking; clone() ensures that any in-place
	    # masking done downstream cannot write through to the caller's tensor.
	    flow = flow.detach().permute(1, 2, 0).clone()  # [H, W, 2]
	    flow = flow_to_image(flow)  # [H, W, 3]
	    flow = np.transpose(flow, (2, 0, 1))  # [3, H, W]

	    return flow