Spaces:

AdamYao
/

Diving-into-the-Fusion-of-Monocular-Priors-for-Generalized-Stereo-Matching

Sleeping

Diving-into-the-Fusion-of-Monocular-Priors-for-Generalized-Stereo-Matching / core /utils /frame_utils.py

BFZD233

initial

f06f310 5 months ago

8.62 kB

	import os
	import numpy as np
	from PIL import Image
	from os.path import *
	import re
	import json
	import imageio
	import cv2
	cv2.setNumThreads(0)
	cv2.ocl.setUseOpenCL(False)

	TAG_CHAR = np.array([202021.25], np.float32)

	def readFlow(fn):
	""" Read .flo file in Middlebury format"""
	# Code adapted from:
	# http://stackoverflow.com/questions/28013200/reading-middlebury-flow-files-with-python-bytes-array-numpy

	# WARNING: this will work on little-endian architectures (eg Intel x86) only!
	# print 'fn = %s'%(fn)
	with open(fn, 'rb') as f:
	magic = np.fromfile(f, np.float32, count=1)
	if 202021.25 != magic:
	print('Magic number incorrect. Invalid .flo file')
	return None
	else:
	w = np.fromfile(f, np.int32, count=1)
	h = np.fromfile(f, np.int32, count=1)
	# print 'Reading %d x %d flo file\n' % (w, h)
	data = np.fromfile(f, np.float32, count=2int(w)int(h))
	# Reshape data into 3D array (columns, rows, bands)
	# The reshape here is for visualization, the original code is (w,h,2)
	return np.resize(data, (int(h), int(w), 2))

	def readPFM(file):
	file = open(file, 'rb')

	color = None
	width = None
	height = None
	scale = None
	endian = None

	header = file.readline().rstrip()
	if header == b'PF':
	color = True
	elif header == b'Pf':
	color = False
	else:
	raise Exception('Not a PFM file.')

	dim_match = re.match(rb'^(\d+)\s(\d+)\s$', file.readline())
	if dim_match:
	width, height = map(int, dim_match.groups())
	else:
	raise Exception('Malformed PFM header.')

	scale = float(file.readline().rstrip())
	if scale < 0: # little-endian
	endian = '<'
	scale = -scale
	else:
	endian = '>' # big-endian

	data = np.fromfile(file, endian + 'f')
	shape = (height, width, 3) if color else (height, width)

	data = np.reshape(data, shape)
	data = np.flipud(data)
	return data

	def writePFM(file, array):
	import os
	assert type(file) is str and type(array) is np.ndarray and \
	os.path.splitext(file)[1] == ".pfm"
	with open(file, 'wb') as f:
	H, W = array.shape
	headers = ["Pf\n", f"{W} {H}\n", "-1\n"]
	for header in headers:
	f.write(str.encode(header))
	array = np.flip(array, axis=0).astype(np.float32)
	f.write(array.tobytes())



	def writeFlow(filename,uv,v=None):
	""" Write optical flow to file.

	If v is None, uv is assumed to contain both u and v channels,
	stacked in depth.
	Original code by Deqing Sun, adapted from Daniel Scharstein.
	"""
	nBands = 2

	if v is None:
	assert(uv.ndim == 3)
	assert(uv.shape[2] == 2)
	u = uv[:,:,0]
	v = uv[:,:,1]
	else:
	u = uv

	assert(u.shape == v.shape)
	height,width = u.shape
	f = open(filename,'wb')
	# write the header
	f.write(TAG_CHAR)
	np.array(width).astype(np.int32).tofile(f)
	np.array(height).astype(np.int32).tofile(f)
	# arrange into matrix form
	tmp = np.zeros((height, width*nBands))
	tmp[:,np.arange(width)*2] = u
	tmp[:,np.arange(width)*2 + 1] = v
	tmp.astype(np.float32).tofile(f)
	f.close()


	def readFlowKITTI(filename):
	flow = cv2.imread(filename, cv2.IMREAD_ANYDEPTH\|cv2.IMREAD_COLOR)
	flow = flow[:,:,::-1].astype(np.float32)
	flow, valid = flow[:, :, :2], flow[:, :, 2]
	flow = (flow - 2**15) / 64.0
	return flow, valid

	def readDispKITTI(filename):
	disp = cv2.imread(filename, cv2.IMREAD_ANYDEPTH) / 256.0
	valid = disp > 0.0
	return disp, valid

	def writeDispKITTI(filename, disp):
	disp = np.round(disp * 256).astype(np.uint16)
	# skimage.io.imsave(filename, disp)
	cv2.imwrite(filename, disp)

	def readDispCRES(filename):
	try:
	disp = cv2.imread(filename, cv2.IMREAD_ANYDEPTH).astype(np.float32) / 32.0
	valid = disp > 0.0
	return disp, valid
	except Exception as err:
	raise(Exception(err, "Something wrong with {}".format(filename), os.getcwd()))

	def writeDispCRES(filename, disp):
	disp = np.round(disp * 32).astype(np.uint16)
	# skimage.io.imsave(filename, disp)
	cv2.imwrite(filename, disp)

	def readDispNerfS(filename):
	disp = cv2.imread(filename, cv2.IMREAD_ANYDEPTH).astype(np.float32) / 64.0

	match = re.search(r"(.*?/Q/)", filename)
	if match:
	prefix = match.group(1) # prefix
	suffix = os.path.basename(filename) # file name
	# AO path, aka confidence
	ao_path = f"{prefix}AO/{suffix}"
	# print("AO图路径:", ao_path)
	else:
	raise Exception("corrupted path for NerfStereo: {}".format(filename))
	valid = cv2.imread(ao_path, cv2.IMREAD_ANYDEPTH).astype(np.float32) / 65535
	return disp, valid

	def writeDispNerfS(filename, disp):
	disp = np.round(disp * 64).astype(np.uint16)
	# skimage.io.imsave(filename, disp)
	cv2.imwrite(filename, disp)

	def readDispBooster(file_name):
	disp = np.load(file_name, encoding='bytes', allow_pickle=True)
	# mask_00 = os.path.join(os.path.split(file_name)[0], 'mask_00.png')
	mask_cat_path = os.path.join(os.path.split(file_name)[0], 'mask_cat.png')
	mask_cat = cv2.imread(mask_cat_path, cv2.IMREAD_ANYDEPTH).astype(np.float32)
	valid = mask_cat
	return disp, valid

	def writeDispBooster(filename, disp):
	# disp = np.round(disp).astype(np.uint16)
	# # skimage.io.imsave(filename, disp)
	# filename = filename.replace(".npy", ".jpg")
	# cv2.imwrite(filename, disp)
	np.save(filename, disp)

	# Method taken from /n/fs/raft-depth/RAFT-Stereo/datasets/SintelStereo/sdk/python/sintel_io.py
	def readDispSintelStereo(file_name):
	a = np.array(Image.open(file_name))
	d_r, d_g, d_b = np.split(a, axis=2, indices_or_sections=3)
	disp = (d_r * 4 + d_g / (26) + d_b / (214))[..., 0]
	mask = np.array(Image.open(file_name.replace('disparities', 'occlusions')))
	valid = ((mask == 0) & (disp > 0))
	return disp, valid

	# Method taken from https://research.nvidia.com/sites/default/files/pubs/2018-06_Falling-Things/readme_0.txt
	def readDispFallingThings(file_name):
	a = np.array(Image.open(file_name))
	with open('/'.join(file_name.split('/')[:-1] + ['_camera_settings.json']), 'r') as f:
	intrinsics = json.load(f)
	fx = intrinsics['camera_settings'][0]['intrinsic_settings']['fx']
	disp = (fx * 6.0 * 100) / a.astype(np.float32)
	valid = disp > 0
	return disp, valid

	# Method taken from https://github.com/castacks/tartanair_tools/blob/master/data_type.md
	def readDispTartanAir(file_name):
	depth = np.load(file_name)
	disp = 80.0 / depth
	valid = disp > 0
	return disp, valid


	def readDispMiddlebury(file_name):
	if basename(file_name) == 'disp0GT.pfm':
	disp = readPFM(file_name).astype(np.float32)
	assert len(disp.shape) == 2
	nocc_pix = file_name.replace('disp0GT.pfm', 'mask0nocc.png')
	assert exists(nocc_pix)
	nocc_pix = imageio.imread(nocc_pix) == 255
	assert np.any(nocc_pix)
	return disp, nocc_pix
	elif basename(file_name) == 'disp0.pfm':
	disp = readPFM(file_name).astype(np.float32)
	valid = disp < 1e3
	return disp, valid

	def writeDispMiddlebury(file_name, disp):
	writePFM(file_name, disp)

	def writeFlowKITTI(filename, uv):
	uv = 64.0 * uv + 2**15
	valid = np.ones([uv.shape[0], uv.shape[1], 1])
	uv = np.concatenate([uv, valid], axis=-1).astype(np.uint16)
	cv2.imwrite(filename, uv[..., ::-1])


	def read_gen(file_name, pil=False):
	ext = splitext(file_name)[-1]
	if ext == '.png' or ext == '.jpeg' or ext == '.ppm' or ext == '.jpg':
	return Image.open(file_name)
	elif ext == '.bin' or ext == '.raw':
	return np.load(file_name)
	elif ext == '.flo':
	return readFlow(file_name).astype(np.float32)
	elif ext == '.pfm':
	flow = readPFM(file_name).astype(np.float32)
	if len(flow.shape) == 2:
	return flow
	else:
	return flow[:, :, :-1]
	return []

	def write_gen(file_name, disp, pil=False):
	ext = splitext(file_name)[-1]
	if ext == '.png' or ext == '.jpeg' or ext == '.ppm' or ext == '.jpg':
	raise Exception("no support for {} file".format(ext))
	elif ext == '.bin' or ext == '.raw':
	np.save(disp, file_name)
	elif ext == '.flo':
	writeFlow(file_name, disp)
	elif ext == '.pfm':
	writePFM(file_name, disp)
	else:
	raise Exception("no support for {} file".format(ext))