# LambdaSuperRes/KAIR/data/degradations.py
from typing import Tuple
import numpy as np
import random
import torch
from basicsr.data.degradations import random_add_gaussian_noise_pt, random_add_poisson_noise_pt
from basicsr.data.transforms import paired_random_crop
from basicsr.utils import DiffJPEG, USMSharp
from basicsr.utils.img_process_util import filter2D
from torch import Tensor
from torch.nn import functional as F


def blur(img: Tensor, kernel: Tensor) -> Tensor:
    """Convolve a batched image (B x C x H x W) with a blur kernel of shape (1, k, k) or (B, k, k)."""
    return filter2D(img, kernel)


def random_resize(
        img: Tensor,
        resize_prob: Tuple[float, float, float],
        resize_range: Tuple[float, float],
        output_scale: float = 1
) -> Tensor:
    """Randomly up-scale, down-scale, or keep the image size, using a random interpolation mode.

    resize_prob gives the sampling weights for the 'up', 'down' and 'keep' branches;
    resize_range bounds the random scale factor.
    """
    updown_type = random.choices(['up', 'down', 'keep'], resize_prob)[0]
    if updown_type == 'up':
        random_scale = np.random.uniform(1, resize_range[1])
    elif updown_type == 'down':
        random_scale = np.random.uniform(resize_range[0], 1)
    else:
        random_scale = 1
    mode = random.choice(['area', 'bilinear', 'bicubic'])
    out = F.interpolate(img, scale_factor=output_scale * random_scale, mode=mode)
    return out


def add_noise(
        img: Tensor,
        gray_noise_prob: float,
        gaussian_noise_prob: float,
        noise_range: Tuple[float, float],
        poisson_scale_range: Tuple[float, float]
) -> Tensor:
    """Add Gaussian noise with probability gaussian_noise_prob, otherwise Poisson noise."""
    if np.random.uniform() < gaussian_noise_prob:
        img = random_add_gaussian_noise_pt(
            img, sigma_range=noise_range, clip=True, rounds=False,
            gray_prob=gray_noise_prob)
    else:
        img = random_add_poisson_noise_pt(
            img, scale_range=poisson_scale_range,
            gray_prob=gray_noise_prob, clip=True, rounds=False)
    return img


def jpeg_compression_simulation(
        img: Tensor,
        jpeg_range: Tuple[float, float],
        jpeg_simulator: DiffJPEG
) -> Tensor:
    """Simulate JPEG compression with a quality factor sampled uniformly from jpeg_range."""
    jpeg_p = img.new_zeros(img.size(0)).uniform_(*jpeg_range)
    # Clamp to [0, 1]; otherwise the JPEG simulator produces unpleasant artifacts.
    img = torch.clamp(img, 0, 1)
    return jpeg_simulator(img, quality=jpeg_p)
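
# Note: DiffJPEG and USMSharp are stateful nn.Modules from basicsr; callers are expected
# to construct them once and reuse them across batches, e.g.
#   jpeg_simulator = DiffJPEG(differentiable=False); usm_sharpener = USMSharp()
# (an illustrative hint, not original code; see the __main__ sketch at the bottom of this file).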


@torch.no_grad()
def apply_real_esrgan_degradations(
        gt: Tensor,
        blur_kernel1: Tensor,
        blur_kernel2: Tensor,
        second_blur_prob: float,
        sinc_kernel: Tensor,
        resize_prob1: Tuple[float, float, float],
        resize_prob2: Tuple[float, float, float],
        resize_range1: Tuple[float, float],
        resize_range2: Tuple[float, float],
        gray_noise_prob1: float,
        gray_noise_prob2: float,
        gaussian_noise_prob1: float,
        gaussian_noise_prob2: float,
        noise_range: Tuple[float, float],
        poisson_scale_range: Tuple[float, float],
        jpeg_compression_range1: Tuple[float, float],
        jpeg_compression_range2: Tuple[float, float],
        jpeg_simulator: DiffJPEG,
        random_crop_gt_size: int,  # e.g. 512
        sr_upsample_scale: int,
        usm_sharpener: USMSharp
):
    """
    Accept a batch from the dataloader and apply the two-stage (second-order)
    Real-ESRGAN degradation process to obtain LQ images.

    gt: Tensor of shape (B x C x H x W), values expected in [0, 1]
    """
    gt_usm = usm_sharpener(gt)
    # from PIL import Image
    # Image.fromarray((gt_usm[0].permute(1, 2, 0).cpu().numpy() * 255.).astype(np.uint8)).save(
    #     "/home/cll/Desktop/GT_USM_orig.png")
    orig_h, orig_w = gt.size()[2:4]

    # ----------------------- The first degradation process ----------------------- #
    out = blur(gt_usm, blur_kernel1)
    out = random_resize(out, resize_prob1, resize_range1)
    out = add_noise(out, gray_noise_prob1, gaussian_noise_prob1, noise_range, poisson_scale_range)
    out = jpeg_compression_simulation(out, jpeg_compression_range1, jpeg_simulator)

    # ----------------------- The second degradation process ----------------------- #
    if np.random.uniform() < second_blur_prob:
        out = blur(out, blur_kernel2)
    out = random_resize(out, resize_prob2, resize_range2, output_scale=(1 / sr_upsample_scale))
    out = add_noise(out, gray_noise_prob2, gaussian_noise_prob2,
                    noise_range, poisson_scale_range)

    # JPEG compression + the final sinc filter.
    # We also need to resize images to the desired size. We group
    # [resize back + sinc filter] together as one operation and consider two orders:
    #   1. [resize back + sinc filter] + JPEG compression
    #   2. JPEG compression + [resize back + sinc filter]
    # Empirically, we find other combinations (sinc + JPEG + resize) introduce twisted lines.
    if np.random.uniform() < 0.5:
        # resize back + the final sinc filter
        mode = random.choice(['area', 'bilinear', 'bicubic'])
        out = F.interpolate(out, size=(orig_h // sr_upsample_scale,
                                       orig_w // sr_upsample_scale), mode=mode)
        out = blur(out, sinc_kernel)
        out = jpeg_compression_simulation(out, jpeg_compression_range2, jpeg_simulator)
    else:
        out = jpeg_compression_simulation(out, jpeg_compression_range2, jpeg_simulator)
        mode = random.choice(['area', 'bilinear', 'bicubic'])
        out = F.interpolate(out, size=(orig_h // sr_upsample_scale,
                                       orig_w // sr_upsample_scale), mode=mode)
        out = blur(out, sinc_kernel)

    # clamp and round
    lq = torch.clamp((out * 255.0).round(), 0, 255) / 255.

    (gt, gt_usm), lq = paired_random_crop([gt, gt_usm], lq, random_crop_gt_size, sr_upsample_scale)
    return gt, gt_usm, lq
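

# ------------------------------------------------------------------------------------ #
# Minimal usage sketch (not part of the original pipeline). It shows how the entry point
# above could be wired up end-to-end. All kernel settings, probabilities and ranges below
# are illustrative assumptions, not the values of any particular KAIR / Real-ESRGAN
# training configuration; only the kernel helpers (random_mixed_kernels,
# circular_lowpass_kernel) and DiffJPEG / USMSharp are real basicsr components.
# ------------------------------------------------------------------------------------ #
if __name__ == '__main__':
    from basicsr.data.degradations import circular_lowpass_kernel, random_mixed_kernels

    def _random_blur_kernel(kernel_size: int = 21) -> Tensor:
        # filter2D (used by blur) operates on torch kernels of shape (1, k, k) or (B, k, k),
        # so the numpy kernel from basicsr is converted here.
        kernel = random_mixed_kernels(
            ['iso', 'aniso'], [0.7, 0.3], kernel_size,
            sigma_x_range=(0.2, 3), sigma_y_range=(0.2, 3),
            rotation_range=(-np.pi, np.pi))
        return torch.from_numpy(kernel).float().unsqueeze(0)

    # Sinc (ringing / overshoot) kernel with a random cutoff frequency.
    omega_c = np.random.uniform(np.pi / 3, np.pi)
    sinc_kernel = torch.from_numpy(
        circular_lowpass_kernel(omega_c, 21, pad_to=21)).float().unsqueeze(0)

    gt_batch = torch.rand(1, 3, 256, 256)  # dummy HR batch in [0, 1]
    gt_crop, gt_usm_crop, lq = apply_real_esrgan_degradations(
        gt_batch,
        blur_kernel1=_random_blur_kernel(),
        blur_kernel2=_random_blur_kernel(),
        second_blur_prob=0.8,
        sinc_kernel=sinc_kernel,
        resize_prob1=(0.2, 0.7, 0.1),
        resize_prob2=(0.3, 0.4, 0.3),
        resize_range1=(0.5, 1.5),
        resize_range2=(0.3, 1.2),
        gray_noise_prob1=0.4,
        gray_noise_prob2=0.4,
        gaussian_noise_prob1=0.5,
        gaussian_noise_prob2=0.5,
        noise_range=(1, 30),
        poisson_scale_range=(0.05, 3),
        jpeg_compression_range1=(30, 95),
        jpeg_compression_range2=(30, 95),
        jpeg_simulator=DiffJPEG(differentiable=False),
        random_crop_gt_size=128,
        sr_upsample_scale=4,
        usm_sharpener=USMSharp())
    # Expected shapes: (1, 3, 128, 128), (1, 3, 128, 128), (1, 3, 32, 32)
    print(gt_crop.shape, gt_usm_crop.shape, lq.shape)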