| import os |
|
|
| import multiprocessing as mp |
| import numpy as np |
| import cv2 as cv |
| from tqdm import tqdm |
|
|
| from glob import glob |
| from utils import * |
|
|
| from grayness_index import GraynessIndex |
|
|
| import torch |
| import torch.nn.functional as F |
|
|
| from time import time |
|
|
| from network_raw_denoise import sc_net_1f |
| from network import MWRCANv4 as NET |
| from classes.fc4.ModelFC4 import ModelFC4 |
|
|
def load_img(img_path):
    """Read one raw PNG plus its sidecar JSON metadata into a record dict.

    Returns a dict with keys 'img_path', 'meta' (parsed JSON metadata) and
    'img' (the raw image, bit depth preserved).
    """
    record = {'img_path': img_path}

    # Metadata sits next to the image with the same stem, .json extension.
    record['meta'] = json_read(img_path.replace(".png", ".json"),
                               object_hook=fraction_from_json)

    # IMREAD_UNCHANGED keeps the original bit depth (no 8-bit conversion).
    record['img'] = cv.imread(img_path, cv.IMREAD_UNCHANGED)

    return record
|
|
|
|
|
|
|
|
def pre_process(meta_all):
    """Pack the Bayer raw into 4 channels, normalize, apply lens-shading
    correction (low-noise shots only) and seed the white-balance gains.

    Reads the module-level global ``lsc_npy`` (per-ISO lens-shading maps,
    loaded in ``__main__`` before the worker pool forks). Mutates and
    returns ``meta_all``.
    """
    img = meta_all['img']

    metadata = meta_all['meta']
    cfa_pattern = metadata['cfa_pattern']
    # Translate the numeric CFA pattern (0/1/2 -> r/g/b) into a string such
    # as "rggb" for bayer_to_offsets.
    cfa_pattern_ = ""
    for tt in cfa_pattern:
        if tt == 0:
            cfa_pattern_ += "r"
        elif tt == 1:
            cfa_pattern_ += "g"
        elif tt == 2:
            cfa_pattern_ += "b"
        else:
            # NOTE(review): bare `raise` with no active exception raises
            # RuntimeError; an explicit ValueError would be clearer.
            raise

    offsets = bayer_to_offsets(cfa_pattern_)
    img = pack_raw_to_4ch(img, offsets)

    # NOTE(review): with `and`, the resize only triggers when BOTH dims
    # differ from 768x1024; `or` may have been intended — confirm the set
    # of input sizes this pipeline actually sees.
    if img.shape[0] != 768 and img.shape[1] != 1024:
        img = cv.resize(img, (1024, 768), interpolation=cv.INTER_AREA)

    # Raise the black level slightly for noisier shots (capped at +10).
    bl_fix = np.clip((float(metadata["noise_profile"][0])-0.005) * 1000, 0, 10)
    img = normalize(img, metadata['black_level'], metadata['white_level'], bl_fix).astype(np.float32)

    noise_profile = float(metadata["noise_profile"][0])
    # Interpolation knots: measured noise-profile values corresponding to
    # the ISO 50/125/320/640/800 maps in lsc_npy (same order).
    noise_list = [0.00025822882, 0.000580020745, 0.00141667975, 0.00278965863, 0.00347614807]

    # Lens-shading correction is applied in raw space only for low-noise
    # shots; noisier shots get a related correction later in convert_to_rgb.
    if noise_profile < 0.005:
        if noise_profile < noise_list[0]:
            # Below the first knot: scale the first map down proportionally.
            weight1 = noise_profile / noise_list[0]
            final_lsc = lsc_npy[0] * weight1
            linear_idx1, linear_idx2 = 0, 0
        elif noise_profile > noise_list[-1]:
            final_lsc = lsc_npy[-1]
            linear_idx1, linear_idx2 = -1, -1
        else:
            # Find the bracketing knots for linear interpolation.
            for idx, nn in enumerate(noise_list):
                if noise_profile < nn:
                    linear_idx1 = idx - 1
                    linear_idx2 = idx
                    break

            # NOTE(review): weight1 grows toward the UPPER knot yet scales
            # lsc_npy[linear_idx1] (the lower map) — the weights look
            # swapped; verify the intended interpolation direction.
            weight1 = (noise_profile - noise_list[linear_idx1]) / (noise_list[linear_idx2] - noise_list[linear_idx1])
            weight2 = 1-weight1
            final_lsc = lsc_npy[linear_idx1] * weight1 + lsc_npy[linear_idx2] * weight2

        # Soften the correction (60% map / 40% identity), then mirror the
        # right half onto the left.
        # NOTE(review): the 1024:511:-1 slice relies on numpy clamping the
        # out-of-range start index (effectively 1023..512 for a width-1024
        # map) — confirm lsc map width is 1024.
        ones = np.ones_like(final_lsc)
        final_lsc = final_lsc * 0.6 + ones * 0.4
        final_lsc[:, :512, :] = final_lsc[:, 1024:511:-1, :]

        img = img * final_lsc

    img = np.clip(img, 0.0, 1.0)
    meta_all["img"] = img

    # Seed gains = inverse of the camera's as-shot neutral; the FC4 folds
    # append three more candidates each in predict_white_balance.
    rgb_gain = metadata['as_shot_neutral']
    ra, ga, ba = rgb_gain
    ra, ga, ba = 1/ra, 1/ga, 1/ba

    meta_all['r_gains'] = [ra]
    meta_all['g_gains'] = [ga]
    meta_all['b_gains'] = [ba]

    return meta_all
|
|
|
|
|
|
def raw_denoise(results):
    """Run the learned raw-domain denoiser over every record, in place.

    The network predicts a residual that is added back onto the ORIGINAL
    (pre-clip) input, so highlights clipped for inference are not lost.
    Each record's 'img' stays float in [0, 1].
    """
    device = torch.device("cuda")
    net = get_net(sc_net_1f, "checkpoint/raw_denoise.pth", device)

    for rec in tqdm(results):
        batched = np.expand_dims(rec['img'], axis=0)
        original = batched.copy()

        # Clip extreme highlights before feeding the net; ceiling adapts to
        # overall brightness but never drops below 0.9.
        ceiling = max(np.mean(batched)*3, 0.9)
        clipped = np.clip(batched, 0, ceiling)
        tensor = torch.from_numpy(clipped.transpose(0, 3, 1, 2)).cuda()

        with torch.no_grad():
            residual = net(tensor)

        residual = residual.detach().cpu().numpy().transpose(0, 2, 3, 1)

        denoised = np.clip(original + residual, 0, 1)
        rec['img'] = np.squeeze(denoised)
|
|
|
|
|
def predict_white_balance(results):
    """Append one illuminant-gain estimate per FC4 fold to every record.

    The image loop is nested INSIDE the fold loop, so after this function
    each record's r/g/b gain lists hold 4 entries: 1 camera as-shot gain
    (from pre_process) + 3 FC4 fold predictions. convert_to_rgb depends on
    exactly this count. Mutates the records in place.
    """
    model = ModelFC4()
    for model_index in [0, 1, 2]:
        # Reload the same model object with each fold's weights in turn.
        path_to_pretrained = os.path.join("./trained_models", "fc4_cwp", "fold_{}".format(model_index))
        model.load(path_to_pretrained)
        model.evaluation_mode()

        for meta_all in tqdm(results):
            img = meta_all['img'].copy()
            # Average the two green samples, drop the 4th plane: 4-ch packed
            # raw -> 3-ch RGB.
            img[:, :, 1] = (img[:, :, 1] + img[:, :, 3]) / 2
            img = img[:, :, :-1]

            img = torch.from_numpy(img.transpose(2, 0, 1)).unsqueeze(0).cuda()
            # FC4 expects gamma-encoded input; approximate with 1/2.2.
            img_tmp = torch.pow(img, 1.0 / 2.2)

            with torch.no_grad():
                pred = model.predict(img_tmp, return_steps=False)
                pred = pred.detach().cpu().squeeze(0).numpy()

            # pred is the estimated illuminant (r, g, b).
            r, g, b = pred

            # Normalize so g == 1 ...
            r /= g
            b /= g
            g /= g

            # ... then invert illuminant -> per-channel gain (g stays 1).
            r = 1./ r
            g = 1./ g
            b = 1./ b

            meta_all['r_gains'].append(r)
            meta_all['g_gains'].append(g)
            meta_all['b_gains'].append(b)
|
|
|
|
def convert_to_rgb(meta_all):
    """Convert the packed 4-channel raw to an sRGB image with WB, color
    transform, tone mapping, noise-aware finishing and orientation fix.

    Reads module-level globals ``color_matrix`` and ``lsc`` (set in
    ``__main__`` before the worker pool forks). Mutates and returns
    ``meta_all``; also records the mean brightness under key 'mm'.
    """
    img = meta_all['img']
    # Average the two greens, drop the 4th plane: 4-ch packed raw -> RGB.
    img[:, :, 1] = (img[:, :, 1] + img[:, :, 3]) / 2
    img = img[:, :, :-1]

    # Combine the 4 gain candidates (1 camera + 3 FC4 folds): after sorting,
    # average the 3 SMALLEST red gains and the 3 LARGEST blue gains.
    r_gains = sorted(meta_all['r_gains'])
    b_gains = sorted(meta_all['b_gains'])

    r_final = (r_gains[0] + r_gains[1] + r_gains[2]) / 3
    g_final = 1
    b_final = (b_gains[1] + b_gains[2] + b_gains[3]) / 3

    img[:, :, 0] *= r_final
    img[:, :, 1] *= g_final
    img[:, :, 2] *= b_final

    img = np.clip(img, 0, 1)

    # NOTE(review): the same 3x3 matrix is passed for both matrix arguments
    # — confirm apply_color_space_transform's signature (helpers like this
    # often take two distinct matrices, e.g. ColorMatrix1/ColorMatrix2).
    img = apply_color_space_transform(img, color_matrix, color_matrix)

    img = transform_xyz_to_srgb(img)

    # For noisy shots: partially UNDO lens shading in the RGB domain and
    # desaturate dark corners toward gray to hide chroma noise.
    if float(meta_all['meta']["noise_profile"][0]) > 0.005:
        # Strength of both effects scales with the noise profile.
        lsc_m = lsc ** ((float(meta_all['meta']["noise_profile"][0])-0.005) * 100)
        lsc_inv = 1 / lsc
        lsc_inv = np.mean(lsc_inv, axis=-1, keepdims=True)

        gray = cv.cvtColor(img.astype(np.float32), cv.COLOR_RGB2GRAY)
        gray = gray[:, :, np.newaxis]

        # Blend weight toward gray: stronger in dark pixels, floored at 0.4.
        lsc_inv = lsc_inv * np.clip(gray*10, 0, 1) * np.clip((2 - (float(meta_all['meta']["noise_profile"][0])-0.005) * 100), 1, 2)
        lsc_inv = np.clip(lsc_inv, 0.4, 1)

        img = img * lsc_inv + gray * (1-lsc_inv)
        img = img / lsc_m

    img = apply_tone_map(img)

    img = apply_gamma(img).astype(np.float32)
    img = np.clip(img, 0, 1)

    # Brightness/noise-dependent finishing:
    #   very dark  -> leave as is;
    #   noisy      -> luma autocontrast blend + NL-means denoise + sharpen;
    #   otherwise  -> plain autocontrast.
    mm = np.mean(img)
    meta_all['mm'] = mm
    if mm <= 0.1:
        pass
    elif float(meta_all['meta']["noise_profile"][0]) > 0.01:
        # NOTE(review): COLOR_BGR2YUV is applied although the array holds
        # RGB at this point, so Y is computed with swapped R/B weights —
        # confirm whether this is intentional.
        yuv = cv.cvtColor(img, cv.COLOR_BGR2YUV)
        y, u, v = cv.split(yuv)
        y = autocontrast_using_pil(y)
        yuv = np.stack([y, u, v], axis=-1)
        rgb = cv.cvtColor(yuv, cv.COLOR_YUV2BGR)
        rgb = np.clip(rgb, 0, 1)

        # 50/50 blend of the contrast-stretched image with the input.
        img = img * 0.5 + rgb * 0.5

        img = np.clip(img*255, 0, 255).round().astype(np.uint8)

        # Stronger NL-means filtering for the noisiest shots.
        if float(meta_all['meta']["noise_profile"][0]) > 0.02:
            noise_params = 6
        else:
            noise_params = 3

        img = cv.fastNlMeansDenoisingColored(img, None, noise_params, noise_params, 7, 21)
        img = img.astype(np.float32) / 255.

        img = usm_sharp(img)
    else:
        img = autocontrast_using_pil(img)

    # Brighten via gamma 1/1.5, weighted by the per-pixel max so highlights
    # take more of the lifted value than shadows (weight floored at 0.3).
    img = np.clip(img, 0, 1)
    img_con = img ** (1/1.5)
    gray = np.max(img_con, axis=-1, keepdims=True)
    gray = np.clip(gray, 0.3, 1)
    img = img_con * gray + img * (1-gray)

    # Grayness-index white-balance refinement, computed on the
    # channel-flipped image and flipped back afterwards; only applied when
    # the normalized red component of the estimated illuminant is < 1.
    img = img[:, :, ::-1]
    gi = GraynessIndex()
    pred_illum = gi.apply(img)
    r, g, b = pred_illum
    pred_illum = pred_illum / g
    r, g, b = pred_illum
    if r < 1:
        img = white_balance(img, pred_illum)
    img = img[:, :, ::-1]
    img = np.clip(img, 0, 1)

    # Rotate/flip according to the EXIF-style orientation tag.
    img = fix_orientation(img, meta_all['meta']["orientation"])

    meta_all['img'] = img
    return meta_all
|
|
|
|
def nn_enhancement(results):
    """Apply the MWRCAN enhancement network to every image, in place.

    Inputs are float images in [0, 1]; each record's 'img' is replaced by
    the network output as uint8 in [0, 255].
    """
    device = torch.device("cuda")
    net = get_net(NET, "checkpoint/nn_enhance.pth", device)

    for rec in tqdm(results):
        # HWC float32 -> 1xCxHxW tensor on the GPU.
        chw = rec['img'].astype(np.float32).copy().transpose(2, 0, 1)
        tensor = torch.from_numpy(chw).unsqueeze(0).to(device)

        with torch.no_grad():
            enhanced = net(tensor)

        hwc = enhanced.detach().cpu().squeeze(0).numpy().transpose(1, 2, 0)
        hwc = np.clip(hwc, 0, 1)

        # Quantize to 8-bit.
        rec['img'] = (hwc * 255.).round().astype(np.uint8)
|
|
|
|
def post_process(meta_all):
    """Boost saturation, then attenuate it around two hue bands, in place.

    Steps:
      1. Increase saturation via HLS (S channel), blending the boosted
         image back using the blue channel as a soft mask so low-blue
         pixels keep their original color.
      2. In HLS space, scale down saturation for hues near green
         (~40-105) and near the magenta/red wrap (~130-180).

    Expects and returns a uint8 RGB image in meta_all['img'].

    Fixes vs. original: uses the module's `cv` alias consistently (the file
    imports `cv2 as cv`, so the bare name `cv2` only worked via star-import
    leakage from `utils`); removes dead `alpha = 1` locals; renames the
    HLS array from the misleading `hsv`.
    """
    img = meta_all['img']

    increment = 0.5
    ori_img = img.copy()

    # --- saturation boost --------------------------------------------------
    hls = cv.cvtColor(img, cv.COLOR_RGB2HLS).astype(np.float32)
    _, L, S = cv.split(hls)
    S = S / 255.

    img = img.astype(np.float32)

    # Where boosted saturation would exceed 1, fall back to the current
    # saturation so the amplification factor below stays bounded.
    temp = increment + S
    mask_2 = temp > 1
    alpha_1 = S
    alpha_2 = 1 - increment
    alpha = alpha_1 * mask_2 + alpha_2 * (1 - mask_2)
    L = L[:, :, np.newaxis]
    alpha = alpha[:, :, np.newaxis]

    # NOTE(review): alpha can be 0 where S == 0 in the mask_2 region,
    # producing inf here; np.clip below contains the result, but confirm.
    alpha = 1 / alpha - 1

    # Push each pixel away from its lightness to raise saturation.
    img = img + (img - L) * alpha

    img = np.clip(img, 0, 255)

    # Blend boosted vs. original using the blue channel as a soft mask.
    ori_img = ori_img.astype(np.float32)
    mask = ori_img[:, :, 2] / 255.
    mask = mask[:, :, np.newaxis]
    mask = np.clip(mask - 0.1, 0, 1)
    img = img * mask + ori_img * (1 - mask)
    img = np.clip(img, 0, 255).round().astype(np.uint8)

    # --- hue-targeted saturation attenuation (HLS channel 2 == S) ----------
    hls = cv.cvtColor(img, cv.COLOR_RGB2HLS).astype(np.float32)

    # Band 1: greens, hue in [40, 105]; weight -> 1 away from band center.
    mmax = 105
    mmin = 40
    beta = 4
    gamma = 0.1

    mid = mmin + ((mmax - mmin) / 2)
    band_weight = np.abs(hls[:, :, 0] - mid) / ((mmax - mmin) / 2)
    band_weight = np.clip(band_weight, 0, 1)

    band_weight = band_weight ** beta + gamma
    band_weight = np.clip(band_weight, 0, 1)

    # Smooth the weight map to avoid hard edges in the result.
    band_weight = cv.blur(band_weight, (11, 11))
    hls[:, :, 2] = hls[:, :, 2] * band_weight

    # Band 2: magenta/red wrap, hue in [130, 180]; sharper falloff.
    mmax = 180
    mmin = 130
    beta = 8
    gamma = -0.5

    mid = mmin + ((mmax - mmin) / 2)
    band_weight = np.abs(hls[:, :, 0] - mid) / ((mmax - mmin) / 2)
    band_weight = np.clip(band_weight, 0, 1)

    band_weight = (band_weight ** beta + gamma) * 2
    band_weight = np.clip(band_weight, 0, 1)

    band_weight = cv.blur(band_weight, (11, 11))
    hls[:, :, 2] = hls[:, :, 2] * band_weight

    hls = np.clip(hls, 0, 255)
    hls = hls.round().astype(np.uint8)

    img = cv.cvtColor(hls, cv.COLOR_HLS2RGB)

    img = np.clip(img, 0, 255).round().astype(np.uint8)
    meta_all['img'] = img
    return meta_all
| |
|
|
|
|
def sky_enhancement(results):
    """Detect sky with a segmentation net and recolor/blend it, in place.

    Only runs on low-noise shots (noise_profile < 0.005). When a sky region
    is found, builds a color-shifted "sky image" (bluer, or brightness/
    saturation-adjusted for non-blue skies) and pyramid-blends it into the
    original scene using a feathered mask.
    """
    # NOTE(review): torch.load of a fully pickled model object — only safe
    # for a trusted checkpoint shipped with this project.
    model_path = "sky_seg.pt"
    model = torch.load(model_path)
    model.cuda()
    model.eval()

    for meta_all in tqdm(results):
        # Skip noisy shots: the sky push would amplify noise.
        if float(meta_all['meta']["noise_profile"][0]) >= 0.005:
            continue

        ori_img = meta_all['img'].copy().astype(np.float32)  # RGB float

        img = ori_img.copy()
        # NOTE(review): bare `cv2` is not imported by this file (it imports
        # `cv2 as cv`); presumably it leaks in via `from utils import *` —
        # verify, or switch to the `cv` alias.
        img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)

        scene_image = img.copy().astype(np.float32)  # BGR, blend target

        # Shift a/b channels in LAB to push colors toward blue; this
        # modified image is also what the segmentation net sees.
        img = img / 255.
        lab = cv2.cvtColor(img, cv2.COLOR_BGR2LAB)

        lab[:,:,1] = lab[:,:,1] - (lab[:,:,2] + 127) * 0.03
        lab[:,:,2] = lab[:,:,2] - (lab[:,:,2] + 127) * 0.1

        img = cv2.cvtColor(lab, cv2.COLOR_LAB2RGB)
        img = img * 255
        img = np.clip(img, 0, 255).round().astype(np.float32)

        # Normalize to [0, 1] and resize to the net's 512x512 input.
        img_mean = 0
        img_std = 255.0
        size = (512, 512)
        img_h , img_w = img.shape[:2]

        img = cv2.resize(img, size)
        img = (img - img_mean) / img_std
        img = np.transpose(img, [2, 0, 1])
        img = np.expand_dims(img, axis=0)
        img = torch.from_numpy(img).cuda()

        with torch.no_grad():
            mask = model(img)

        # Net output is NHWC; upsample logits back to the original size and
        # take the argmax as a hard sky mask (nonzero == sky).
        mask = mask.detach().cpu()
        mask = mask.permute((0,3,1,2))
        mask = F.interpolate(mask,
                size=[img_h , img_w],
                mode='bilinear')
        mask = mask[0].permute((1,2,0))
        sky_mask = torch.argmax(mask, axis=2).numpy().astype(np.float32)

        # No sky pixels detected -> leave this image untouched.
        if sky_mask.max() < 0.1:
            continue

        # Mean "blueness" (B minus max(R, G)) over the sky region.
        img = ori_img.copy()
        mask = img[:, :, 2] - np.max(img[:, :, :2], axis=-1)
        mask[sky_mask==0]=0
        a = np.sum(mask)
        b = np.sum(sky_mask)
        ratio_blue = a/b

        if ratio_blue < 10:
            # Not a blue sky: decide by mean R/G brightness of the region.
            img = ori_img.copy()
            mask = np.mean(img[:, :, :2], axis=-1)
            mask[sky_mask==0]=0
            a = np.sum(mask)
            b = np.sum(sky_mask)
            ratio_light = a/b

            if ratio_light<50:
                # Dark sky: darken slightly.
                img = ori_img.copy()
                img = img * 0.88
                img = np.clip(img, 0, 255)

            elif ratio_light < 200:
                # Mid-brightness sky: brighten slightly.
                img = ori_img.copy()
                img = img * 1.1
                img = np.clip(img, 0, 255)
            else:
                # Bright sky: keep brightness as is.
                pass

            # Desaturate: non-blue skies look better with muted chroma.
            hsv = cv2.cvtColor(img.astype(np.uint8), cv2.COLOR_RGB2HSV).astype(np.float32)
            hsv[:, :, 1] = hsv[:, :, 1]* 0.4
            hsv = np.clip(hsv, 0, 255).astype(np.uint8)
            img = cv2.cvtColor(hsv, cv2.COLOR_HSV2RGB).astype(np.float32)

        else:
            # Blue sky: apply the same LAB blue shift to the original image.
            img = ori_img.copy()
            img = img / 255.
            lab = cv2.cvtColor(img, cv2.COLOR_RGB2LAB)

            lab[:,:,1] = lab[:,:,1] - (lab[:,:,2] + 127) * 0.03
            lab[:,:,2] = lab[:,:,2] - (lab[:,:,2] + 127) * 0.1

            img = cv2.cvtColor(lab, cv2.COLOR_LAB2RGB)

            img = img * 255
            img = np.clip(img, 0, 255).round().astype(np.float32)

        sky_image = img.copy().astype(np.float32)
        sky_image = cv2.cvtColor(sky_image, cv2.COLOR_RGB2BGR)

        # Erode the hard mask so only confident interior sky pixels count
        # toward the brightness gate below.
        sky_mask_ori = sky_mask.copy()
        kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (11, 11))
        sky_mask_ori = cv2.erode(sky_mask_ori, kernel)

        sky_mask_ori = sky_mask_ori > 0.9

        if np.sum(sky_mask_ori) > 0:
            h, w = sky_mask.shape

            # Feather the blend mask: dilate + blur at 1/10 scale, restore
            # confident-sky values, resize back, and floor at 0.1 so the
            # sky image always contributes a little everywhere.
            sky_mask = cv2.resize(sky_mask, None, fx=0.1, fy=0.1, interpolation=cv2.INTER_NEAREST)
            kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (5, 5))
            sky_mask = cv2.dilate(sky_mask, kernel)
            sky_mask_blur = cv2.blur(sky_mask, (21, 21))
            sky_mask_blur[sky_mask>0.5] = sky_mask[sky_mask>0.5]
            sky_mask = sky_mask_blur
            sky_mask = cv2.resize(sky_mask, (w, h), interpolation=cv2.INTER_LINEAR)
            sky_mask = np.clip(sky_mask, 0.1, 1)

            # Gate: skip nearly-black skies (mean gray of the confident sky
            # region must exceed 20/255).
            sky_area_img = np.zeros_like(sky_image)
            sky_area_img[sky_mask_ori] = sky_image[sky_mask_ori]
            sky_area_img = cv2.cvtColor(sky_area_img, cv2.COLOR_BGR2GRAY)

            sky_area_img_mean = np.sum(sky_area_img) / np.sum(sky_mask_ori)
            if sky_area_img_mean > 20:
                # Laplacian-pyramid blend of the recolored sky into the
                # original scene, then back to RGB uint8.
                res = pyrblend(scene_image, sky_image, sky_mask)
                res = np.clip(res, 0, 255)

                res = res.round().astype(np.uint8)
                res = cv2.cvtColor(res, cv2.COLOR_BGR2RGB)
                meta_all['img'] = res
|
|
|
|
|
|
def post_process2(meta_all):
    """Autocontrast the luma channel, blended back by a brightness mask.

    Expects a uint8 RGB image in meta_all['img']; dark pixels keep the
    original values, brighter pixels take the contrast-stretched result.
    Mutates and returns meta_all.
    """
    src = meta_all['img'].copy().astype(np.float32) / 255.

    # Stretch contrast on Y only so chroma stays untouched.
    yuv = cv.cvtColor(src, cv.COLOR_RGB2YUV)
    y, u, v = cv.split(yuv)
    y = autocontrast_using_pil(y)
    stretched = cv.cvtColor(np.stack([y, u, v], axis=-1), cv.COLOR_YUV2RGB)
    stretched = np.clip(stretched, 0, 1)

    boosted = np.clip(stretched * 255, 0, 255)

    # Per-pixel blend weight from mean brightness (shifted down by 0.1).
    original = meta_all['img'].copy().astype(np.float32)
    weight = np.mean(original, axis=-1)[:, :, np.newaxis] / 255.
    weight = np.clip(weight - 0.1, 0, 1)

    blended = boosted * weight + original * (1 - weight)
    blended = np.clip(blended, 0, 255)

    meta_all['img'] = blended.round().astype(np.uint8)

    return meta_all
|
|
|
|
def save_jpg(meta_all):
    """Write the finished image as a maximum-quality JPEG.

    The output reuses the input basename with a .jpg extension under the
    module-level global `output_path` (set in __main__). Channels are
    flipped RGB -> BGR for OpenCV's writer.
    """
    basename = meta_all['img_path'].split("/")[-1].split(".")[0]
    out_path = os.path.join(output_path, basename + ".jpg")

    cv.imwrite(out_path, meta_all['img'][:, :, ::-1],
               [cv.IMWRITE_JPEG_QUALITY, 100])
| |
|
|
|
|
if __name__ == "__main__":
    # Worker count for the CPU-bound stages; the GPU stages (raw_denoise,
    # predict_white_balance, nn_enhancement, sky_enhancement) always run
    # serially in this process.
    num_worker = 4

    all_time = time()

    input_path = "/data"
    output_path = "/data"  # also read as a module global by save_jpg

    os.makedirs(output_path, exist_ok=True)

    # ---- stage 1: load raw PNGs + JSON metadata ----------------------------
    s_time = time()
    input_list = sorted(glob(os.path.join(input_path, "*.png")))

    if num_worker > 1:
        with mp.Pool(num_worker) as pool:
            results = list(tqdm(pool.imap(load_img, input_list), total=len(input_list)))
    else:
        results = []
        for p in tqdm(input_list):
            results.append(load_img(p))
    load_time = time()-s_time
    print("load_img time is: ", load_time)

    # ---- stage 2: pack/normalize/lens-shading ------------------------------
    s_time = time()
    iso_list = [50, 125, 320, 640, 800]
    # Per-ISO lens-shading maps, read by pre_process as a module global.
    # NOTE(review): worker processes only see these globals with the fork
    # start method (Linux default); this would break under spawn.
    lsc_npy = [np.load("./lsc_npy/{}.npy".format(iso)) for iso in iso_list]

    if num_worker > 1:
        with mp.Pool(num_worker) as pool:
            results = list(tqdm(pool.imap(pre_process, results), total=len(results)))
    else:
        for r in tqdm(results):
            r = pre_process(r)
    # Free the maps before the GPU stages to keep RSS down.
    del lsc_npy
    print("pre_process time is: ", time()-s_time)

    # ---- stage 3: GPU raw-domain denoising ---------------------------------
    s_time = time()
    raw_denoise(results)
    print("raw_denoise time is: ", time()-s_time)

    # ---- stage 4: FC4 white-balance predictions (3 folds) ------------------
    s_time = time()
    predict_white_balance(results)
    print("predict_white_balance time is: ", time()-s_time)

    # ---- stage 5: raw -> sRGB conversion ------------------------------------
    s_time = time()
    # Globals read by convert_to_rgb inside the forked workers.
    color_matrix = [1.06835938, -0.29882812, -0.14257812, -0.43164062, 1.35546875, 0.05078125, -0.1015625, 0.24414062, 0.5859375]
    lsc = np.load("lsc.npy")
    if num_worker > 1:
        with mp.Pool(num_worker) as pool:
            results = list(tqdm(pool.imap(convert_to_rgb, results), total=len(results)))
    else:
        for r in tqdm(results):
            r = convert_to_rgb(r)
    del lsc
    print("convert_to_rgb time is: ", time()-s_time)

    # ---- stage 6: GPU enhancement network -----------------------------------
    s_time = time()
    nn_enhancement(results)
    print("nn_enhancement time is: ", time()-s_time)

    # ---- stage 7: saturation/hue post-processing ----------------------------
    s_time = time()
    # NOTE(review): `kernel` does not appear to be used by post_process —
    # likely a leftover; confirm before removing.
    kernel = cv.getStructuringElement(cv.MORPH_RECT, (5, 5))
    if num_worker > 1:
        with mp.Pool(num_worker) as pool:
            results = list(tqdm(pool.imap(post_process, results), total=len(results)))
    else:
        for r in tqdm(results):
            r = post_process(r)
    print("post_process time is: ", time()-s_time)

    # ---- stage 8: sky segmentation + blending (GPU) -------------------------
    s_time = time()
    sky_enhancement(results)
    print("sky_enhancement time is: ", time()-s_time)

    # ---- stage 9: global autocontrast pass ----------------------------------
    s_time = time()
    if num_worker > 1:
        with mp.Pool(num_worker) as pool:
            results = list(tqdm(pool.imap(post_process2, results), total=len(results)))
    else:
        for r in tqdm(results):
            r = post_process2(r)
    print("post_process2 time is: ", time()-s_time)

    # ---- stage 10: write JPEGs ----------------------------------------------
    s_time = time()
    if num_worker > 1:
        with mp.Pool(num_worker) as pool:
            _ = list(tqdm(pool.imap(save_jpg, results), total=len(results)))
    else:
        for r in tqdm(results):
            save_jpg(r)
    save_time = time()-s_time
    print("save_jpg time is: ", save_time)

    # Report per-image time excluding disk I/O stages.
    total_time = time()-all_time
    total_time_without_load_save = total_time - load_time - save_time
    print("per image inference time (without load and save) is: ", total_time_without_load_save / len(results), "s")