2020-08-22 14:24:34 +00:00
|
|
|
import torch
|
|
|
|
import torch.nn as nn
|
2020-10-22 20:39:19 +00:00
|
|
|
from torch.cuda.amp import autocast
|
|
|
|
|
2020-08-22 14:24:34 +00:00
|
|
|
from models.networks import define_F
|
|
|
|
from models.loss import GANLoss
|
2020-09-27 03:25:32 +00:00
|
|
|
import random
|
|
|
|
import functools
|
2020-11-12 22:42:05 +00:00
|
|
|
import torch.nn.functional as F
|
|
|
|
import numpy as np
|
2020-08-22 14:24:34 +00:00
|
|
|
|
|
|
|
|
2020-09-29 04:09:42 +00:00
|
|
|
def create_loss(opt_loss, env):
    """Build the loss object selected by ``opt_loss['type']``.

    Args:
        opt_loss: Mapping with the loss configuration. Only the ``'type'`` key is read here; the whole mapping is
            forwarded to the constructor (or factory) of the selected loss.
        env: Environment object forwarded unchanged to the selected loss.

    Returns:
        The constructed loss object.

    Raises:
        NotImplementedError: If ``opt_loss['type']`` does not match any known loss type.
    """
    # Named loss_type (not `type`) so the builtin is not shadowed inside this function.
    loss_type = opt_loss['type']
    if 'teco_' in loss_type:
        # Imported lazily, only when a type containing 'teco_' is actually requested.
        from models.steps.tecogan_losses import create_teco_loss
        return create_teco_loss(opt_loss, env)
    elif loss_type == 'pix':
        return PixLoss(opt_loss, env)
    elif loss_type == 'direct':
        return DirectLoss(opt_loss, env)
    elif loss_type == 'feature':
        return FeatureLoss(opt_loss, env)
    elif loss_type == 'interpreted_feature':
        return InterpretedFeatureLoss(opt_loss, env)
    elif loss_type == 'generator_gan':
        return GeneratorGanLoss(opt_loss, env)
    elif loss_type == 'discriminator_gan':
        return DiscriminatorGanLoss(opt_loss, env)
    elif loss_type == 'geometric':
        return GeometricSimilarityGeneratorLoss(opt_loss, env)
    elif loss_type == 'translational':
        return TranslationInvarianceLoss(opt_loss, env)
    elif loss_type == 'recursive':
        return RecursiveInvarianceLoss(opt_loss, env)
    elif loss_type == 'recurrent':
        return RecurrentLoss(opt_loss, env)
    elif loss_type == 'for_element':
        return ForElementLoss(opt_loss, env)
    elif loss_type == 'stylegan2_divergence':
        return StyleGan2DivergenceLoss(opt_loss, env)
    elif loss_type == 'stylegan2_pathlen':
        return StyleGan2PathLengthLoss(opt_loss, env)
    else:
        # Same exception type as before, but now it says which type was rejected.
        raise NotImplementedError("Unrecognized loss type: %r" % (loss_type,))
|
|
|
|
|
|
|
|
|
2020-09-11 03:35:29 +00:00
|
|
|
# Converts params to a list of tensors extracted from state. Works with list/tuple params as well as scalars.
|
2020-10-18 04:54:12 +00:00
|
|
|
def extract_params_from_state(params: object, state: object, root: object = True) -> object:
    """Resolve ``params`` against ``state``.

    Args:
        params: A string key into ``state``, the literal string ``'None'`` (resolved to ``None``), a list/tuple of
            such entries (resolved element by element, recursively), or any other value (passed through unchanged).
        state: Mapping indexed by the string keys found in ``params``.
        root: True for the outermost call. The outermost result is always a list; nested calls pass False.

    Returns:
        A list of resolved values when ``root`` is truthy, otherwise the resolved value itself.
    """
    if isinstance(params, str):
        # The string 'None' is a placeholder for an absent value rather than a key into state.
        resolved = None if params == 'None' else state[params]
    elif isinstance(params, (list, tuple)):
        resolved = [extract_params_from_state(entry, state, False) for entry in params]
    else:
        resolved = params

    # The root return must always be a list.
    if root and not isinstance(resolved, list):
        return [resolved]
    return resolved
|
|
|
|
|
|
|
|
|
2020-08-22 14:24:34 +00:00
|
|
|
class ConfigurableLoss(nn.Module):
    """Base class for losses that are built from an options mapping and an environment.

    Subclasses override forward(). Metrics gathered while computing a loss are kept in ``self.metrics`` and are
    exposed through extra_metrics() / clear_metrics().
    """

    def __init__(self, opt, env):
        """Store the options and environment and start with an empty metrics list."""
        super().__init__()
        self.opt, self.env = opt, env
        self.metrics = []

    # net is either a scalar network being trained or a list of networks being trained, depending on the configuration.
    def forward(self, net, state):
        """Compute the loss; must be provided by subclasses."""
        raise NotImplementedError

    def extra_metrics(self):
        """Return the list of metrics recorded so far (the live list, not a copy)."""
        return self.metrics

    def clear_metrics(self):
        """Drop all recorded metrics by rebinding ``self.metrics`` to a new empty list."""
        self.metrics = []
|
|
|
|
|
2020-08-22 14:24:34 +00:00
|
|
|
|
|
|
|
def get_basic_criterion_for_name(name, device):
    """Create one of the basic torch criteria and move it to ``device``.

    Args:
        name: ``'l1'`` (nn.L1Loss), ``'l2'`` (nn.MSELoss) or ``'cosine'`` (nn.CosineEmbeddingLoss).
        device: Device passed to ``.to()`` on the new criterion.

    Returns:
        The criterion module, already moved to ``device``.

    Raises:
        NotImplementedError: If ``name`` is not one of the supported names.
    """
    if name == 'l1':
        return nn.L1Loss().to(device)
    elif name == 'l2':
        return nn.MSELoss().to(device)
    elif name == 'cosine':
        return nn.CosineEmbeddingLoss().to(device)
    else:
        # Same exception type as before, but the message now names the rejected criterion.
        raise NotImplementedError("Unrecognized criterion name: %r" % (name,))
|
|
|
|
|
|
|
|
|
|
|
|
class PixLoss(ConfigurableLoss):
    """Applies a basic criterion directly to two tensors taken from the state.

    Options read: 'criterion', 'real', 'fake', plus optional 'real_scale' (default 1), 'real_offset' (default 0)
    and 'report_metrics' (default False).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        self.real_scale = opt.get('real_scale', 1)
        self.real_offset = opt.get('real_offset', 0)
        self.report_metrics = opt.get('report_metrics', False)

    def forward(self, _, state):
        """Return criterion(fake, real * real_scale + real_offset), computed in float32."""
        # Only the "real" tensor is rescaled and shifted; "fake" is used as found in the state.
        real = state[self.opt['real']] * self.real_scale + float(self.real_offset)
        fake = state[self.opt['fake']]
        if self.report_metrics:
            # dim=[1,2,3] reduces every dimension except the first, so both tensors must be 4-dimensional here.
            self.metrics.extend([
                ("real_pix_mean_histogram", torch.mean(real, dim=[1, 2, 3]).detach()),
                ("fake_pix_mean_histogram", torch.mean(fake, dim=[1, 2, 3]).detach()),
                ("real_pix_std", torch.std(real).detach()),
                ("fake_pix_std", torch.std(fake).detach()),
            ])
        return self.criterion(fake.float(), real.float())
|
|
|
|
|
|
|
|
|
|
|
|
# Loss defined by averaging the input tensor across all dimensions and optionally inverting it.
|
|
|
|
class DirectLoss(ConfigurableLoss):
    """Uses the mean of a single state tensor as the loss, negated when 'inverted' is set.

    Options read: 'key' (state entry to average) and optional 'inverted' (default False).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.inverted = opt.get('inverted', False)
        self.key = opt['key']

    def forward(self, _, state):
        """Return mean(state[key]), or its negation when inverted."""
        mean = torch.mean(state[self.key])
        return -mean if self.inverted else mean
|
2020-08-22 14:24:34 +00:00
|
|
|
|
|
|
|
|
|
|
|
class FeatureLoss(ConfigurableLoss):
    """Compares the outputs of a feature network (built by define_F) for the "real" and "fake" state tensors.

    Options read: 'criterion', 'which_model_F', 'real', 'fake' and optional 'load_path' (default None).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        feature_net = define_F(which_model=opt['which_model_F'], load_path=opt.get('load_path'))
        self.netF = feature_net.to(self.env['device'])
        # Outside of distributed mode the feature network is wrapped in DataParallel over the configured GPUs.
        if not env['opt']['dist']:
            self.netF = torch.nn.parallel.DataParallel(self.netF, device_ids=env['opt']['gpu_ids'])

    def forward(self, _, state):
        """Return the criterion applied to netF(fake) and netF(real), both cast to float32."""
        with autocast(enabled=self.env['opt']['fp16']):
            # No gradient is tracked for the "real" branch; the "fake" branch stays differentiable.
            with torch.no_grad():
                logits_real = self.netF(state[self.opt['real']])
            logits_fake = self.netF(state[self.opt['fake']])

        fake_features = logits_fake.float()
        real_features = logits_real.float()
        if self.opt['criterion'] != 'cosine':
            return self.criterion(fake_features, real_features)
        # CosineEmbeddingLoss takes a third "target" argument; a target of 1 asks for the inputs to be similar.
        target = torch.ones(1, device=logits_fake.device)
        return self.criterion(fake_features, real_features, target)
|
2020-08-22 14:24:34 +00:00
|
|
|
|
|
|
|
|
2020-09-02 16:08:24 +00:00
|
|
|
# Special form of feature loss which first computes the feature embedding for the truth space, then uses a second
|
|
|
|
# network which was trained to replicate that embedding on an altered input space (for example, LR or greyscale) to
|
|
|
|
# compute the embedding in the generated space. Useful for weakening the influence of the feature network in controlled
|
|
|
|
# ways.
|
|
|
|
class InterpretedFeatureLoss(ConfigurableLoss):
    """Feature loss using two networks: one for the "real" tensor and a separately loaded one for the "fake" tensor.

    Options read: 'criterion', 'which_model_F', 'load_path', 'real', 'fake'. Both networks are built by define_F with
    the same 'which_model_F'; only the "fake"-side network is given 'load_path'.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        device = self.env['device']
        self.netF_real = define_F(which_model=opt['which_model_F']).to(device)
        self.netF_gen = define_F(which_model=opt['which_model_F'], load_path=opt['load_path']).to(device)
        if not env['opt']['dist']:
            # No device_ids are passed here, so DataParallel falls back to its own default device selection.
            self.netF_real = torch.nn.parallel.DataParallel(self.netF_real)
            self.netF_gen = torch.nn.parallel.DataParallel(self.netF_gen)

    def forward(self, _, state):
        """Return criterion(netF_gen(fake), netF_real(real)), both cast to float32."""
        real_features = self.netF_real(state[self.opt['real']])
        fake_features = self.netF_gen(state[self.opt['fake']])
        return self.criterion(fake_features.float(), real_features.float())
|
2020-09-02 16:08:24 +00:00
|
|
|
|
|
|
|
|
2020-08-22 14:24:34 +00:00
|
|
|
class GeneratorGanLoss(ConfigurableLoss):
    """Generator-side GAN loss computed against a discriminator taken from ``env['discriminators']``.

    Options read: 'gan_type', 'discriminator', 'real', 'fake' and optional 'noise' (default None),
    'detach_real' (default True) and 'min_loss' (default 0).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.criterion = GANLoss(opt['gan_type'], 1.0, 0.0).to(env['device'])
        self.noise = opt.get('noise')
        self.detach_real = opt.get('detach_real', True)
        # This is a mechanism to prevent backpropagation for a GAN loss if it goes too low. This can be used to balance
        # generators and discriminators by essentially having them skip steps while their counterparts "catch up".
        self.min_loss = opt.get('min_loss', 0)
        if self.min_loss != 0:
            # Ring buffer holding the 10 most recent loss values; it starts out filled with zeros.
            self.loss_rotating_buffer = torch.zeros(10, requires_grad=False)
            self.rb_ptr = 0
            self.losses_computed = 0

    def forward(self, _, state):
        """Return the generator GAN loss, or 0 when the min_loss mechanism suppresses this step.

        Raises:
            NotImplementedError: If 'gan_type' is not 'gan', 'pixgan', 'pixgan_fea' or 'ragan'.
        """
        netD = self.env['discriminators'][self.opt['discriminator']]
        real = extract_params_from_state(self.opt['real'], state)
        fake = extract_params_from_state(self.opt['fake'], state)

        if self.noise:
            # Add gaussian noise scaled by self.noise to every tensor input; non-tensor inputs pass through.
            # The noise for fake[i] is drawn with the shape of the matching "real" entry.
            noisy_real, noisy_fake = [], []
            for idx, r in enumerate(real):
                if isinstance(r, torch.Tensor):
                    noisy_real.append(r + torch.randn_like(r) * self.noise)
                    noisy_fake.append(fake[idx] + torch.randn_like(r) * self.noise)
                else:
                    noisy_real.append(r)
                    noisy_fake.append(fake[idx])
            real, fake = noisy_real, noisy_fake

        gan_type = self.opt['gan_type']
        with autocast(enabled=self.env['opt']['fp16']):
            if gan_type in ('gan', 'pixgan', 'pixgan_fea'):
                pred_g_fake = netD(*fake)
                loss = self.criterion(pred_g_fake, True)
            elif gan_type == 'ragan':
                pred_d_real = netD(*real)
                if self.detach_real:
                    pred_d_real = pred_d_real.detach()
                pred_g_fake = netD(*fake)
                d_fake_diff = pred_g_fake - torch.mean(pred_d_real)
                self.metrics.append(("d_fake", torch.mean(pred_g_fake)))
                self.metrics.append(("d_fake_diff", torch.mean(d_fake_diff)))
                # Relativistic average form: each prediction is measured against the mean of the other side.
                real_term = self.criterion(pred_d_real - torch.mean(pred_g_fake), False)
                fake_term = self.criterion(d_fake_diff, True)
                loss = (real_term + fake_term) / 2
            else:
                raise NotImplementedError

        if self.min_loss != 0:
            self.loss_rotating_buffer[self.rb_ptr] = loss.item()
            self.rb_ptr = (self.rb_ptr + 1) % self.loss_rotating_buffer.shape[0]
            # Skip this step (plain 0 instead of a tensor) while the recent average is below the threshold.
            if torch.mean(self.loss_rotating_buffer) < self.min_loss:
                return 0
            self.losses_computed += 1
            self.metrics.append(("loss_counter", self.losses_computed))
        return loss
|
2020-08-22 14:24:34 +00:00
|
|
|
|
|
|
|
|
|
|
|
class DiscriminatorGanLoss(ConfigurableLoss):
    """Discriminator-side GAN loss; the network passed to forward() is the discriminator.

    Options read: 'gan_type', 'real', 'fake' and optional 'noise' (default None) and 'min_loss' (default 0).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.criterion = GANLoss(opt['gan_type'], 1.0, 0.0).to(env['device'])
        self.noise = opt.get('noise')
        # This is a mechanism to prevent backpropagation for a GAN loss if it goes too low. This can be used to balance
        # generators and discriminators by essentially having them skip steps while their counterparts "catch up".
        self.min_loss = opt.get('min_loss', 0)
        if self.min_loss != 0:
            assert not self.env['dist']  # distributed training does not support 'min_loss' - it can result in backward() desync by design.
            # Ring buffer holding the 10 most recent loss values; it starts out filled with zeros.
            self.loss_rotating_buffer = torch.zeros(10, requires_grad=False)
            self.rb_ptr = 0
            self.losses_computed = 0

    def forward(self, net, state):
        """Return the discriminator GAN loss, or 0 when the min_loss mechanism suppresses this step.

        Raises:
            NotImplementedError: If 'gan_type' is not 'gan', 'pixgan', 'ragan' or 'max_spread'.
        """
        # Every input is detached so this loss cannot backpropagate into whatever produced it.
        real = [r.detach() for r in extract_params_from_state(self.opt['real'], state)]
        fake = [f.detach() for f in extract_params_from_state(self.opt['fake'], state)]

        if self.noise:
            # Add gaussian noise scaled by self.noise to every tensor input; non-tensor inputs pass through.
            # The noise for fake[i] is drawn with the shape of the matching "real" entry.
            noisy_real, noisy_fake = [], []
            for idx, r in enumerate(real):
                if isinstance(r, torch.Tensor):
                    noisy_real.append(r + torch.randn_like(r) * self.noise)
                    noisy_fake.append(fake[idx] + torch.randn_like(r) * self.noise)
                else:
                    noisy_real.append(r)
                    noisy_fake.append(fake[idx])
            real, fake = noisy_real, noisy_fake

        with autocast(enabled=self.env['opt']['fp16']):
            d_real = net(*real)
            d_fake = net(*fake)

        gan_type = self.opt['gan_type']
        if gan_type in ('gan', 'pixgan'):
            self.metrics.append(("d_fake", torch.mean(d_fake)))
            self.metrics.append(("d_real", torch.mean(d_real)))
            l_real = self.criterion(d_real, True)
            l_fake = self.criterion(d_fake, False)
            loss = l_real + l_fake
        elif gan_type in ('ragan', 'max_spread'):
            d_fake_diff = d_fake - torch.mean(d_real)
            self.metrics.append(("d_fake_diff", torch.mean(d_fake_diff)))
            # Relativistic average form: each prediction is measured against the mean of the other side.
            loss = (self.criterion(d_real - torch.mean(d_fake), True) +
                    self.criterion(d_fake_diff, False))
        else:
            raise NotImplementedError

        if self.min_loss != 0:
            self.loss_rotating_buffer[self.rb_ptr] = loss.item()
            self.rb_ptr = (self.rb_ptr + 1) % self.loss_rotating_buffer.shape[0]
            # The counter metric is reported on every call, including the ones that are skipped below.
            self.metrics.append(("loss_counter", self.losses_computed))
            if torch.mean(self.loss_rotating_buffer) < self.min_loss:
                return 0
            self.losses_computed += 1
        return loss
|
2020-08-23 23:22:34 +00:00
|
|
|
|
2020-09-20 22:24:23 +00:00
|
|
|
|
|
|
|
# Computes a loss created by comparing the output of a generator to the output from the same generator when fed an
|
|
|
|
# input that has been altered randomly by rotation or flip.
|
|
|
|
# The "real" parameter to this loss is the actual output of the generator (from an injection point)
|
|
|
|
# The "fake" parameter is the LR input that produced the "real" parameter when fed through the generator.
|
|
|
|
class GeometricSimilarityGeneratorLoss(ConfigurableLoss):
    """Compares a stored generator output against the output for a randomly flipped/rotated input.

    Options read: 'generator', 'criterion', 'real', 'fake' and optional 'input_alteration_index' (default 0),
    'generator_output_index' (default None) and 'detach_fake' (default False).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.generator = opt['generator']
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        self.gen_input_for_alteration = opt.get('input_alteration_index', 0)
        self.gen_output_to_use = opt.get('generator_output_index', None)
        self.detach_fake = opt.get('detach_fake', False)

    # Returns a random alteration and its counterpart (that undoes the alteration)
    def random_alteration(self):
        """Pick one (alteration, undo) pair of callables acting on dims 2 and 3 of a tensor."""
        candidates = [
            # A flip is its own inverse.
            (functools.partial(torch.flip, dims=(2,)), functools.partial(torch.flip, dims=(2,))),
            (functools.partial(torch.flip, dims=(3,)), functools.partial(torch.flip, dims=(3,))),
            # A rotation by k quarter turns is undone by 4-k quarter turns.
            (functools.partial(torch.rot90, k=1, dims=[2,3]), functools.partial(torch.rot90, k=3, dims=[2,3])),
            (functools.partial(torch.rot90, k=2, dims=[2,3]), functools.partial(torch.rot90, k=2, dims=[2,3])),
            (functools.partial(torch.rot90, k=3, dims=[2,3]), functools.partial(torch.rot90, k=1, dims=[2,3])),
        ]
        return random.choice(candidates)

    def forward(self, net, state):
        """Run the generator on the altered inputs, undo the alteration and compare with state[opt['real']]."""
        net = self.env['generators'][self.generator]  # Get the network from an explicit parameter.
        # The <net> parameter is not reliable for generator losses since often they are combined with many networks.
        fake = extract_params_from_state(self.opt['fake'], state)
        alteration, undo_fn = self.random_alteration()
        # Only the input at gen_input_for_alteration is altered; all other inputs are forwarded untouched.
        altered = [alteration(t) if idx == self.gen_input_for_alteration else t
                   for idx, t in enumerate(fake)]

        with autocast(enabled=self.env['opt']['fp16']):
            if self.detach_fake:
                with torch.no_grad():
                    upsampled_altered = net(*altered)
            else:
                upsampled_altered = net(*altered)

        if self.gen_output_to_use is not None:
            upsampled_altered = upsampled_altered[self.gen_output_to_use]

        # Undo alteration on HR image
        upsampled_altered = undo_fn(upsampled_altered)

        reference = state[self.opt['real']]
        if self.opt['criterion'] != 'cosine':
            return self.criterion(reference.float(), upsampled_altered.float())
        # The cosine criterion takes an extra target tensor and is fed the tensors without the float() cast.
        return self.criterion(reference, upsampled_altered, torch.ones(1, device=upsampled_altered.device))
|
2020-09-27 03:25:32 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Computes a loss created by comparing the output of a generator to the output from the same generator when fed an
|
|
|
|
# input that has been translated in a random direction.
|
|
|
|
# The "real" parameter to this loss is the actual output of the generator on the top left image patch.
|
|
|
|
# The "fake" parameter is the output base fed into a ImagePatchInjector.
|
|
|
|
class TranslationInvarianceLoss(ConfigurableLoss):
    """Compares the overlapping region of a stored generator output and the output for a translated input.

    Options read: 'generator', 'criterion', 'real', 'fake', 'patch_size', 'overlap', 'detach_fake' and optional
    'input_alteration_index' (default 0) and 'generator_output_index' (default None).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.generator = opt['generator']
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        self.gen_input_for_alteration = opt.get('input_alteration_index', 0)
        self.gen_output_to_use = opt.get('generator_output_index', None)
        self.patch_size = opt['patch_size']
        self.overlap = opt['overlap']  # For maximum overlap, can be calculated as 2*patch_size-image_size
        self.detach_fake = opt['detach_fake']
        assert(self.patch_size > self.overlap)

    def forward(self, net, state):
        """Run the generator on a randomly chosen translated input and compare the shared output region."""
        net = self.env['generators'][self.generator]  # Get the network from an explicit parameter.
        # The <net> parameter is not reliable for generator losses since often they are combined with many networks.

        border_sz = self.patch_size - self.overlap
        # Each entry: (state-name suffix, row start, row end, column start, column end) of the shared region
        # inside the translated output.
        choices = [("top_right", border_sz, border_sz+self.overlap, 0, self.overlap),
                   ("bottom_left", 0, self.overlap, border_sz, border_sz+self.overlap),
                   ("bottom_right", 0, self.overlap, 0, self.overlap)]
        trans_name, hl, hh, wl, wh = random.choice(choices)

        # Change the "fake" input name that we are translating to one that specifies the random translation.
        fake = self.opt['fake'].copy()
        fake[self.gen_input_for_alteration] = "%s_%s" % (fake[self.gen_input_for_alteration], trans_name)
        input = extract_params_from_state(fake, state)

        with autocast(enabled=self.env['opt']['fp16']):
            if self.detach_fake:
                with torch.no_grad():
                    trans_output = net(*input)
            else:
                trans_output = net(*input)

        if self.gen_output_to_use is not None:
            trans_output = trans_output[self.gen_output_to_use]
        fake_shared_output = trans_output[:, :, hl:hh, wl:wh]

        # The "real" input is assumed to always come from the top left tile.
        gen_output = state[self.opt['real']]
        shared = slice(border_sz, border_sz+self.overlap)
        real_shared_output = gen_output[:, :, shared, shared]

        if self.opt['criterion'] != 'cosine':
            return self.criterion(fake_shared_output.float(), real_shared_output.float())
        # The cosine criterion takes an extra target tensor and is fed the tensors without the float() cast.
        return self.criterion(fake_shared_output, real_shared_output, torch.ones(1, device=real_shared_output.device))
|
2020-09-27 03:25:32 +00:00
|
|
|
|
2020-10-05 02:48:15 +00:00
|
|
|
|
|
|
|
# Computes a loss repeatedly feeding the generator downsampled inputs created from its outputs. The expectation is
|
|
|
|
# that the generator's outputs do not change on repeated forward passes.
|
|
|
|
# The "real" parameter to this loss is the actual output of the generator.
|
|
|
|
# The "fake" parameter is the expected inputs that should be fed into the generator. 'input_alteration_index' is changed
|
|
|
|
# so that it feeds the recursive input.
|
|
|
|
class RecursiveInvarianceLoss(ConfigurableLoss):
    """Feeds downsampled generator outputs back into the generator and compares the result with the first output.

    Options read: 'generator', 'criterion', 'real', 'fake', 'recursive_depth', 'downsample_factor' and optional
    'input_alteration_index' (default 0) and 'generator_output_index' (default None, meaning the generator output
    is used as returned).
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.opt = opt
        self.generator = opt['generator']
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        self.gen_input_for_alteration = opt.get('input_alteration_index', 0)
        self.gen_output_to_use = opt.get('generator_output_index', None)
        self.recursive_depth = opt['recursive_depth']  # How many times to recursively feed the output of the generator back into itself
        self.downsample_factor = opt['downsample_factor']  # Just 1/opt['scale']. Necessary since this loss doesn't have access to opt['scale'].
        assert(self.recursive_depth > 0)

    def forward(self, net, state):
        """Return the criterion between state[opt['real']] and the output after recursive_depth re-generations."""
        net = self.env['generators'][self.generator]  # Get the network from an explicit parameter.
        # The <net> parameter is not reliable for generator losses since they can be combined with many networks.

        gen_output = state[self.opt['real']]
        recurrent_gen_output = gen_output

        # extract_params_from_state returns a new list at the root, so overwriting one slot below does not touch
        # the configuration in self.opt.
        gen_inputs = extract_params_from_state(self.opt['fake'], state)
        for _ in range(self.recursive_depth):
            # Replace the selected generator input with a nearest-neighbour downsample of the previous output.
            gen_inputs[self.gen_input_for_alteration] = torch.nn.functional.interpolate(
                recurrent_gen_output, scale_factor=self.downsample_factor, mode="nearest")
            with autocast(enabled=self.env['opt']['fp16']):
                recurrent_gen_output = net(*gen_inputs)
            # Only index into the output when an index was configured. Indexing with the default None would fail
            # on tuple outputs and would add a leading dimension to tensor outputs.
            if self.gen_output_to_use is not None:
                recurrent_gen_output = recurrent_gen_output[self.gen_output_to_use]

        compare_real = gen_output
        compare_fake = recurrent_gen_output
        if self.opt['criterion'] == 'cosine':
            # The cosine criterion takes an extra target tensor and is fed the tensors without the float() cast.
            return self.criterion(compare_real, compare_fake, torch.ones(1, device=compare_real.device))
        else:
            return self.criterion(compare_real.float(), compare_fake.float())
|
2020-10-05 02:48:15 +00:00
|
|
|
|
2020-10-07 15:03:30 +00:00
|
|
|
|
|
|
|
# Loss that pulls tensors from dim 1 of the input and repeatedly feeds them into the
|
|
|
|
# 'subtype' loss.
|
|
|
|
class RecurrentLoss(ConfigurableLoss):
    """Applies a wrapped 'subtype' loss to every slice along dim 1 of the "real"/"fake" tensors and sums the results.

    Options read: 'subtype', 'real', 'fake' and optional 'recurrent_weights'. The remaining options are passed on
    to the wrapped loss.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        # The wrapped loss gets a copy of the options in which it reads its inputs from the temporary
        # '_real' / '_fake' state entries filled in by forward().
        sub_opt = opt.copy()
        sub_opt['type'] = opt['subtype']
        sub_opt['fake'] = '_fake'
        sub_opt['real'] = '_real'
        self.loss = create_loss(sub_opt, self.env)
        # Use this option to specify a differential weighting scheme for losses inside of the recurrent construct. For
        # example, if later recurrent outputs should contribute more to the loss than earlier ones. When specified,
        # must be a list of weights that exactly aligns with the recurrent list fed to forward().
        self.recurrent_weights = opt.get('recurrent_weights', 1)

    def forward(self, net, state):
        """Return the (optionally weighted) sum of the wrapped loss over all slices along dim 1."""
        total_loss = 0
        st = state.copy()  # Shallow copy, so the caller's state never sees the temporary entries.
        real = state[self.opt['real']]
        use_weights = isinstance(self.recurrent_weights, list)
        for step in range(real.shape[1]):
            st['_real'] = real[:, step]
            st['_fake'] = state[self.opt['fake']][:, step]
            subloss = self.loss(net, st)
            # Weights are applied only when given as a list; the scalar default leaves the sub-loss untouched.
            if use_weights:
                subloss = subloss * self.recurrent_weights[step]
            total_loss += subloss
        return total_loss

    def extra_metrics(self):
        """Return the metrics of the wrapped loss."""
        return self.loss.extra_metrics()

    def clear_metrics(self):
        """Clear the metrics of the wrapped loss."""
        self.loss.clear_metrics()
|
|
|
|
|
2020-10-10 01:51:44 +00:00
|
|
|
|
|
|
|
# Loss that pulls a tensor from dim 1 of the input and feeds it into a "sub" loss.
|
|
|
|
class ForElementLoss(ConfigurableLoss):
    """Applies a wrapped 'subtype' loss to one fixed slice along dim 1 of the "real"/"fake" tensors.

    Options read: 'subtype', 'index', 'real', 'fake'. The remaining options are passed on to the wrapped loss.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.index = opt['index']
        # The wrapped loss gets a copy of the options in which it reads its inputs from the temporary
        # '_real' / '_fake' state entries filled in by forward().
        sub_opt = opt.copy()
        sub_opt['type'] = opt['subtype']
        sub_opt['fake'] = '_fake'
        sub_opt['real'] = '_real'
        self.loss = create_loss(sub_opt, self.env)

    def forward(self, net, state):
        """Return the wrapped loss evaluated on slice ``index`` of dim 1 of both tensors."""
        st = state.copy()  # Shallow copy, so the caller's state never sees the temporary entries.
        st['_real'] = state[self.opt['real']][:, self.index]
        st['_fake'] = state[self.opt['fake']][:, self.index]
        return self.loss(net, st)

    def extra_metrics(self):
        """Return the metrics of the wrapped loss."""
        return self.loss.extra_metrics()

    def clear_metrics(self):
        """Clear the metrics of the wrapped loss."""
        self.loss.clear_metrics()
|
2020-11-12 22:42:05 +00:00
|
|
|
|
|
|
|
|
|
|
|
class StyleGan2DivergenceLoss(ConfigurableLoss):
    """Divergence loss evaluated with a discriminator taken from ``env['discriminators']``.

    Options read: 'real', 'fake', 'discriminator', 'gen_loss' and 'gradient_penalty_frequency'.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.real = opt['real']
        self.fake = opt['fake']
        self.discriminator = opt['discriminator']
        self.for_gen = opt['gen_loss']
        self.gp_frequency = opt['gradient_penalty_frequency']

    def forward(self, net, state):
        """Return mean(D(fake)) when 'gen_loss' is set, otherwise the hinge divergence plus a periodic penalty."""
        D = self.env['discriminators'][self.discriminator]
        fake = D(state[self.fake])
        if self.for_gen:
            return fake.mean()

        real_input = state[self.real].requires_grad_()  # <-- Needed to compute gradients on the input.
        real = D(real_input)
        divergence_loss = (F.relu(1 + real) + F.relu(1 - fake)).mean()

        # Apply gradient penalty. TODO: migrate this elsewhere.
        # The penalty is only added on steps that are a multiple of gp_frequency.
        if self.env['step'] % self.gp_frequency == 0:
            from models.archs.stylegan2 import gradient_penalty
            gp = gradient_penalty(real_input, real)
            self.metrics.append(("gradient_penalty", gp.clone().detach()))
            divergence_loss = divergence_loss + gp

        # requires_grad_ above modified the state tensor in place, so switch the flag back off before returning.
        real_input.requires_grad_(requires_grad=False)
        return divergence_loss
|
2020-11-12 22:42:05 +00:00
|
|
|
|
|
|
|
|
|
|
|
class StyleGan2PathLengthLoss(ConfigurableLoss):
    """Penalizes the squared deviation of path lengths from a running mean of earlier path lengths.

    Options read: 'w_styles' and 'gen', both names of state entries handed to calc_pl_lengths.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.w_styles = opt['w_styles']
        self.gen = opt['gen']
        self.pl_mean = None
        from models.archs.stylegan2 import EMA
        self.pl_length_ma = EMA(.99)

    def forward(self, net, state):
        """Return mean((pl_lengths - pl_mean)^2) when a running mean exists and the value is not NaN, else 0."""
        from models.archs.stylegan2 import calc_pl_lengths
        from models.archs.stylegan2 import is_empty

        w_styles = state[self.w_styles]
        gen = state[self.gen]
        pl_lengths = calc_pl_lengths(w_styles, gen)
        avg_pl_length = np.mean(pl_lengths.detach().cpu().numpy())

        if not is_empty(self.pl_mean):
            pl_loss = ((pl_lengths - self.pl_mean) ** 2).mean()
            if torch.isnan(pl_loss):
                print("Path length loss returned NaN!")
            else:
                return pl_loss

        # NOTE(review): as written, the running mean is only refreshed on calls that do not return a loss above
        # (no mean yet, or a NaN loss) - confirm this is intended.
        self.pl_mean = self.pl_length_ma.update_average(self.pl_mean, avg_pl_length)
        return 0
|