import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision.transforms as T
import numpy as np
import cv2

# from vgg19_loss import VGG19Loss
# import pytorch_ssim
from .vgg19_loss import VGG19Loss
from . import pytorch_ssim

from abc import ABC, abstractmethod
from collections import OrderedDict


class abs_loss(ABC):
    """Common interface: every loss exposes loss(gt_img, pred_img)."""

    @abstractmethod
    def loss(self, gt_img, pred_img):
        pass


class norm_loss(abs_loss):
    def __init__(self, norm=1):
        self.norm = norm

    def loss(self, gt_img, pred_img):
        """p-norm of (I - I'), normalised by pixel count and batch size.
        (Originally noted as M * (I - I'); no mask M is applied here.)
        """
        b, c, h, w = gt_img.shape
        return torch.norm(gt_img - pred_img, self.norm) / (h * w * b)


class ssim_loss(abs_loss):
    def __init__(self, window_size=11, channel=1):
        """Let's try mean SSIM: a uniform box window instead of the usual Gaussian."""
        self.channel = channel
        self.window_size = window_size
        self.window = self.create_mean_window(window_size, channel)

    def loss(self, gt_img, pred_img):
        b, c, h, w = gt_img.shape
        # Rebuild the window if the channel count changed since construction.
        if c != self.channel:
            self.channel = c
            self.window = self.create_mean_window(self.window_size, self.channel)
        self.window = self.window.to(gt_img).type_as(gt_img)
        return 1.0 - self.ssim_compute(gt_img, pred_img)

    def create_mean_window(self, window_size, channel):
        # Uniform averaging window, one filter per channel (used with grouped conv).
        window = torch.ones(channel, 1, window_size, window_size).float()
        window = window / (window_size * window_size)
        return window

    def ssim_compute(self, gt_img, pred_img):
        window = self.window
        window_size = self.window_size
        channel = self.channel
        # Local means via per-channel box filtering.
        mu1 = F.conv2d(gt_img, window, padding=window_size // 2, groups=channel)
        mu2 = F.conv2d(pred_img, window, padding=window_size // 2, groups=channel)
        mu1_sq = mu1.pow(2)
        mu2_sq = mu2.pow(2)
        mu1_mu2 = mu1 * mu2
        # Local variances and covariance.
        sigma1_sq = F.conv2d(gt_img * gt_img, window, padding=window_size // 2, groups=channel) - mu1_sq
        sigma2_sq = F.conv2d(pred_img * pred_img, window, padding=window_size // 2, groups=channel) - mu2_sq
        sigma12 = F.conv2d(gt_img * pred_img, window, padding=window_size // 2, groups=channel) - mu1_mu2
        # Standard SSIM stability constants (K1=0.01, K2=0.03) for inputs in [0, 1].
        C1 = 0.01 ** 2
        C2 = 0.03 ** 2
        ssim_map = ((2 * mu1_mu2 + C1) * (2 * sigma12 + C2)) / ((mu1_sq + mu2_sq + C1) * (sigma1_sq + sigma2_sq + C2))
        return ssim_map.mean()
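
    # For reference, the map computed above is the standard SSIM index
    # (Wang et al.), here evaluated with a uniform window rather than a Gaussian:
    #
    #   SSIM(x, y) = ((2*mu_x*mu_y + C1) * (2*sigma_xy + C2))
    #                / ((mu_x^2 + mu_y^2 + C1) * (sigma_x^2 + sigma_y^2 + C2))
    #
    # with C1 = (0.01)^2 and C2 = (0.03)^2 assuming intensities in [0, 1];
    # loss() then returns 1 - mean(SSIM).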


class hierarchical_ssim_loss(abs_loss):
    def __init__(self, patch_list: list):
        # One SSIM term per window size listed in patch_list.
        self.ssim_loss_list = [pytorch_ssim.SSIM(window_size=ws) for ws in patch_list]

    def loss(self, gt_img, pred_img):
        b, c, h, w = gt_img.shape
        total_loss = 0.0
        for loss_func in self.ssim_loss_list:
            total_loss += (1.0 - loss_func(gt_img, pred_img))
        return total_loss / b


class vgg_loss(abs_loss):
    def __init__(self):
        self.vgg19_ = VGG19Loss()

    def loss(self, gt_img, pred_img):
        b, c, h, w = gt_img.shape
        v = self.vgg19_(gt_img, pred_img, pred_img.device)
        return v / b


class grad_loss(abs_loss):
    def __init__(self, k=4):
        # Number of scales in the multi-scale smoothness term.
        self.k = k

    def loss(self, disp_img, rgb_img=None):
        """Multi-scale smoothness loss on disp_img. When rgb_img is given, the
        disparity gradients are weighted by an edge-aware term from the image.
        """
        b, c, h, w = disp_img.shape
        grad_loss = 0.0
        for i in range(self.k):
            div_factor = 2 ** i
            # Downscale by 2**i (smaller edge matched to h // div_factor).
            cur_transform = T.Resize([h // div_factor, ])
            cur_disp = cur_transform(disp_img)
            cur_disp_dx, cur_disp_dy = self.img_grad(cur_disp)
            if rgb_img is not None:
                cur_rgb = cur_transform(rgb_img)
                cur_rgb_dx, cur_rgb_dy = self.img_grad(cur_rgb)
                # Edge-aware weights: close to 1 in flat regions, small at strong RGB edges.
                cur_rgb_dx = torch.exp(-torch.mean(torch.abs(cur_rgb_dx), dim=1, keepdim=True))
                cur_rgb_dy = torch.exp(-torch.mean(torch.abs(cur_rgb_dy), dim=1, keepdim=True))
                grad_loss += (torch.sum(torch.abs(cur_disp_dx) * cur_rgb_dx) + torch.sum(torch.abs(cur_disp_dy) * cur_rgb_dy)) / (h * w * self.k)
            else:
                grad_loss += (torch.sum(torch.abs(cur_disp_dx)) + torch.sum(torch.abs(cur_disp_dy))) / (h * w * self.k)
        return grad_loss / b
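
    # Note on the weighting above: exp(-|dI|) stays near 1 where the RGB guide is
    # smooth and decays toward 0 at its edges, so disparity gradients are penalised
    # mainly in flat image regions. This is the usual edge-aware smoothness
    # construction used in self-supervised depth/disparity training.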

    def gloss(self, gt, pred):
        """Loss in the gradient domain: squared difference of Sobel gradients."""
        b, c, h, w = gt.shape
        gt_dx, gt_dy = self.img_grad(gt)
        pred_dx, pred_dy = self.img_grad(pred)
        loss = (gt_dx - pred_dx) ** 2 + (gt_dy - pred_dy) ** 2
        return loss.sum() / (b * h * w)

    def laploss(self, pred):
        """Mean absolute Laplacian response of pred."""
        b, c, h, w = pred.shape
        lap = self.img_laplacian(pred)
        return torch.abs(lap).sum() / (b * h * w)

    def img_laplacian(self, img):
        b, c, h, w = img.shape
        # 9-point discrete Laplacian stencil (unnormalised); channels are summed
        # into a single-channel response map.
        laplacian = torch.tensor([[1, 4, 1], [4, -20, 4], [1, 4, 1]])
        laplacian_kernel = laplacian.float().unsqueeze(0).expand(1, c, 3, 3).to(img)
        lap = F.conv2d(img, laplacian_kernel, padding=1, stride=1)
        return lap

    def img_grad(self, img):
        """Compute image gradients with Sobel filters.
        img: B x C x H x W
        """
        b, c, h, w = img.shape
        ysobel = torch.tensor([[1, 2, 1], [0, 0, 0], [-1, -2, -1]])
        xsobel = ysobel.transpose(0, 1)
        xsobel_kernel = xsobel.float().unsqueeze(0).expand(1, c, 3, 3).to(img)
        ysobel_kernel = ysobel.float().unsqueeze(0).expand(1, c, 3, 3).to(img)
        dx = F.conv2d(img, xsobel_kernel, padding=1, stride=1)
        dy = F.conv2d(img, ysobel_kernel, padding=1, stride=1)
        return dx, dy


class sharp_loss(abs_loss):
    """Sharpness term combining
    1. Laplacian response
    2. local image contrast
    3. local image variance
    """

    def __init__(self, window_size=11, channel=1):
        self.window_size = window_size
        self.channel = channel
        self.window = self.create_mean_window(window_size, self.channel)

    def loss(self, gt_img, pred_img):
        """Compare per-pixel sharpness maps (Laplacian, local contrast, local
        variance) of the two images and return their mean absolute difference.
        """
        b, c, h, w = gt_img.shape
        if c != self.channel:
            self.channel = c
            self.window = self.create_mean_window(self.window_size, self.channel)
        self.window = self.window.to(gt_img).type_as(gt_img)
        channel = self.channel
        window = self.window
        window_size = self.window_size
        # Local means, with a small epsilon so the contrast term is well defined.
        mu1 = F.conv2d(gt_img, window, padding=window_size // 2, groups=channel) + 1e-6
        mu2 = F.conv2d(pred_img, window, padding=window_size // 2, groups=channel) + 1e-6
        contrast1 = torch.absolute((gt_img - mu1) / mu1)
        contrast2 = torch.absolute((pred_img - mu2) / mu2)
        variance1 = (gt_img - mu1) ** 2
        variance2 = (pred_img - mu2) ** 2
        laplacian1 = self.img_laplacian(gt_img)
        laplacian2 = self.img_laplacian(pred_img)
        S1 = -laplacian1 - contrast1 - variance1
        S2 = -laplacian2 - contrast2 - variance2
        total = torch.absolute(S1 - S2).mean()
        return total

    def img_laplacian(self, img):
        b, c, h, w = img.shape
        laplacian = torch.tensor([[1, 4, 1], [4, -20, 4], [1, 4, 1]])
        laplacian_kernel = laplacian.float().unsqueeze(0).expand(1, c, 3, 3).to(img)
        lap = F.conv2d(img, laplacian_kernel, padding=1, stride=1)
        return lap

    def create_mean_window(self, window_size, channel):
        window = torch.ones(channel, 1, window_size, window_size).float()
        window = window / (window_size * window_size)
        return window


if __name__ == '__main__':
    a = torch.rand(3, 3, 128, 128)
    b = torch.rand(3, 3, 128, 128)

    ssim = ssim_loss()
    loss = ssim.loss(a, b)
    print(loss.shape, loss)
    loss = ssim.loss(a, a)
    print(loss.shape, loss)
    loss = ssim.loss(b, b)
    print(loss.shape, loss)

    grad = grad_loss()
    # loss() expects a single RGB guide tensor, not a list.
    loss = grad.loss(a, b)
    print(loss.shape, loss)

    sharp = sharp_loss()
    loss = sharp.loss(a, b)
    print(loss.shape, loss)
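
    # Additional sketch (not part of the original tests): exercise norm_loss and
    # the gradient-domain helpers defined above.
    l1 = norm_loss(norm=1)
    print(l1.loss(a, b))
    print(grad.gloss(a, b))   # squared difference of Sobel gradients
    print(grad.laploss(a))    # mean absolute Laplacian response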