DL-Art-School/codes/models/steps/losses.py

import torch
import torch.nn as nn
from models.networks import define_F
from models.loss import GANLoss


def create_generator_loss(opt_loss, env):
    """Build the configurable loss selected by ``opt_loss['type']``.

    Args:
        opt_loss: Loss configuration mapping. Its ``'type'`` entry selects the loss class; the whole mapping is
            forwarded to that class's constructor.
        env: Environment object forwarded unchanged to the loss constructor.

    Returns:
        A new instance of the loss class matching the requested type.

    Raises:
        NotImplementedError: If ``opt_loss['type']`` is not one of the names handled below.
    """
    # Named `loss_type` rather than `type` so the builtin is not shadowed inside this function.
    loss_type = opt_loss['type']
    if loss_type == 'pix':
        return PixLoss(opt_loss, env)
    elif loss_type == 'feature':
        return FeatureLoss(opt_loss, env)
    elif loss_type == 'interpreted_feature':
        return InterpretedFeatureLoss(opt_loss, env)
    elif loss_type == 'generator_gan':
        return GeneratorGanLoss(opt_loss, env)
    elif loss_type == 'discriminator_gan':
        return DiscriminatorGanLoss(opt_loss, env)
    else:
        # Include the offending value so a config typo is easy to spot.
        raise NotImplementedError('Unsupported loss type: %r' % (loss_type,))


# Converts params to a list of tensors extracted from state. Works with list/tuple params as well as scalars.
def extract_params_from_state(params, state):
    """Look up one key or several keys in ``state`` and always return the results as a list.

    Args:
        params: Either a single key, or a list/tuple of keys.
        state: Mapping that is indexed with each key.

    Returns:
        A list with ``state[key]`` for every key, in order. A single (non list/tuple) key yields a
        one-element list.
    """
    keys = params if isinstance(params, (list, tuple)) else (params,)
    return [state[key] for key in keys]


class ConfigurableLoss(nn.Module):
    """Base class for losses that are built from an options mapping plus a shared environment.

    Subclasses must override ``forward``. They may also fill ``self.metrics`` with values to report through
    ``extra_metrics``.
    """

    def __init__(self, opt, env):
        """Store the loss options and the environment, and start with no extra metrics."""
        super().__init__()
        self.opt, self.env = opt, env
        self.metrics = []

    def forward(self, net, state):
        """Compute the loss; must be implemented by subclasses.

        Args:
            net: Either a scalar network being trained or a list of networks being trained, depending on the
                configuration.
            state: Mapping the loss reads its inputs from.
        """
        raise NotImplementedError

    def extra_metrics(self):
        """Return the list of extra metrics currently held by this loss."""
        return self.metrics


def get_basic_criterion_for_name(name, device):
    """Create an elementwise criterion by short name and move it to ``device``.

    Args:
        name: ``'l1'`` for ``nn.L1Loss`` or ``'l2'`` for ``nn.MSELoss``.
        device: Target passed to the module's ``.to()``.

    Returns:
        The freshly constructed criterion module.

    Raises:
        NotImplementedError: For any other ``name``.
    """
    if name == 'l1':
        criterion_cls = nn.L1Loss
    elif name == 'l2':
        criterion_cls = nn.MSELoss
    else:
        raise NotImplementedError
    return criterion_cls().to(device)


class PixLoss(ConfigurableLoss):
    """Loss that applies a basic criterion directly to two entries of the training state.

    Options read: ``'criterion'`` (name of the basic criterion), ``'fake'`` and ``'real'`` (state keys).
    """

    def __init__(self, opt, env):
        # The base constructor already stores `opt` and `env` on the instance.
        super().__init__(opt, env)
        target_device = env['device']
        self.criterion = get_basic_criterion_for_name(opt['criterion'], target_device)

    def forward(self, _, state):
        """Return ``criterion(state[fake_key], state[real_key])``; the network argument is unused."""
        generated = state[self.opt['fake']]
        target = state[self.opt['real']]
        return self.criterion(generated, target)


class FeatureLoss(ConfigurableLoss):
    """Loss computed between the outputs of a feature network for the 'fake' and 'real' state entries.

    Options read: ``'criterion'``, ``'which_model_F'``, optional ``'load_path'``, and the state keys ``'fake'``
    and ``'real'``.
    """

    def __init__(self, opt, env):
        # The base constructor already stores `opt` and `env` on the instance.
        super().__init__(opt, env)
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        model_name = opt['which_model_F']
        # 'load_path' is optional; None is forwarded when it is absent.
        weights_path = opt.get('load_path')
        feature_net = define_F(which_model=model_name, load_path=weights_path).to(self.env['device'])
        # Outside of distributed mode the feature network is wrapped in DataParallel.
        if not env['opt']['dist']:
            feature_net = torch.nn.parallel.DataParallel(feature_net)
        self.netF = feature_net

    def forward(self, _, state):
        """Return the criterion between the feature-network outputs for fake and real inputs.

        The real branch runs under ``torch.no_grad()``; the fake branch keeps gradient tracking enabled.
        """
        real_input = state[self.opt['real']]
        with torch.no_grad():
            real_features = self.netF(real_input)
        fake_features = self.netF(state[self.opt['fake']])
        return self.criterion(fake_features, real_features)


# Special form of feature loss which first computes the feature embedding for the truth space, then uses a second
# network which was trained to replicate that embedding on an altered input space (for example, LR or greyscale) to
# compute the embedding in the generated space. Useful for weakening the influence of the feature network in controlled
# ways.
class InterpretedFeatureLoss(ConfigurableLoss):
    """Feature loss that uses two separate feature networks: one for the real input, one for the fake input.

    Both networks are built from ``opt['which_model_F']``. Only the network applied to the fake input is given
    ``opt['load_path']`` (required here); the one applied to the real input is built without a load path.
    """

    def __init__(self, opt, env):
        # The base constructor already stores `opt` and `env` on the instance.
        super().__init__(opt, env)
        self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])
        device = self.env['device']
        real_net = define_F(which_model=opt['which_model_F']).to(device)
        gen_net = define_F(which_model=opt['which_model_F'], load_path=opt['load_path']).to(device)
        # Outside of distributed mode both networks are wrapped in DataParallel.
        if not env['opt']['dist']:
            real_net = torch.nn.parallel.DataParallel(real_net)
            gen_net = torch.nn.parallel.DataParallel(gen_net)
        self.netF_real = real_net
        self.netF_gen = gen_net

    def forward(self, _, state):
        """Return the criterion between ``netF_gen(fake)`` and ``netF_real(real)``; the network argument is unused."""
        # NOTE(review): unlike FeatureLoss, the real branch is not wrapped in torch.no_grad() - confirm intended.
        real_embedding = self.netF_real(state[self.opt['real']])
        fake_embedding = self.netF_gen(state[self.opt['fake']])
        return self.criterion(fake_embedding, real_embedding)


class GeneratorGanLoss(ConfigurableLoss):
    """Adversarial loss for the generator side of a GAN.

    Options read: ``'gan_type'``, ``'discriminator'`` (key into ``env['discriminators']``), ``'fake'`` and, for
    the 'ragan' type only, ``'real'``. ``'fake'``/``'real'`` may each be a single state key or a list/tuple of
    keys; the extracted tensors are passed positionally to the discriminator.
    """

    def __init__(self, opt, env):
        super(GeneratorGanLoss, self).__init__(opt, env)
        self.opt = opt
        # presumably 1.0 / 0.0 are the real / fake label values expected by GANLoss - TODO confirm
        self.criterion = GANLoss(opt['gan_type'], 1.0, 0.0).to(env['device'])

    def forward(self, _, state):
        """Compute the generator's adversarial loss.

        Args:
            _: Unused; the discriminator is looked up in ``self.env['discriminators']`` instead.
            state: Mapping holding the tensors named by the ``'fake'`` / ``'real'`` options.

        Returns:
            The loss value produced by ``self.criterion``.

        Raises:
            NotImplementedError: If ``opt['gan_type']`` is not handled here.
        """
        netD = self.env['discriminators'][self.opt['discriminator']]
        fake = extract_params_from_state(self.opt['fake'], state)
        gan_type = self.opt['gan_type']
        if gan_type in ['gan', 'pixgan', 'pixgan_fea']:
            pred_g_fake = netD(*fake)
            return self.criterion(pred_g_fake, True)
        elif gan_type == 'ragan':
            real = extract_params_from_state(self.opt['real'], state)
            # Real inputs and the real prediction are detached so no gradient flows through the real branch.
            real = [r.detach() for r in real]
            pred_d_real = netD(*real).detach()
            pred_g_fake = netD(*fake)
            # Bug fix: this branch previously called `self.cri_gan`, an attribute that is never assigned
            # (the constructor stores the criterion as `self.criterion`), so it always raised AttributeError.
            return (self.criterion(pred_d_real - torch.mean(pred_g_fake), False) +
                    self.criterion(pred_g_fake - torch.mean(pred_d_real), True)) / 2
        else:
            raise NotImplementedError


class DiscriminatorGanLoss(ConfigurableLoss):
    """Adversarial loss for the discriminator side of a GAN.

    Options read: ``'gan_type'``, ``'real'``, ``'fake'`` and the optional ``'noise'``. ``'real'``/``'fake'`` may
    each be a single state key or a list/tuple of keys; the extracted tensors are passed positionally to the
    discriminator. After each call, ``extra_metrics()`` holds the mean discriminator outputs for the fake and
    real inputs as ``("d_fake", ...)`` and ``("d_real", ...)``.
    """

    def __init__(self, opt, env):
        super(DiscriminatorGanLoss, self).__init__(opt, env)
        self.opt = opt
        # presumably 1.0 / 0.0 are the real / fake label values expected by GANLoss - TODO confirm
        self.criterion = GANLoss(opt['gan_type'], 1.0, 0.0).to(env['device'])
        self.noise = None if 'noise' not in opt.keys() else opt['noise']

    def forward(self, net, state):
        """Compute the discriminator's adversarial loss.

        Args:
            net: The discriminator being trained; called once with the real inputs and once with the fake inputs.
            state: Mapping holding the tensors named by the ``'real'`` / ``'fake'`` options.

        Returns:
            The loss value produced by ``self.criterion``.

        Raises:
            NotImplementedError: If ``opt['gan_type']`` is not handled here.
        """
        self.metrics = []
        real = extract_params_from_state(self.opt['real'], state)
        fake = extract_params_from_state(self.opt['fake'], state)
        # Detach so discriminator gradients do not flow back into whatever produced the fake inputs.
        fake = [f.detach() for f in fake]
        if self.noise:
            # An assumption is made that the first input to the discriminator is what we want to add noise to. If
            # not, use an explicit formulation of adding noise (using an injector).
            #
            # Bug fix: the noise is added out-of-place. The previous in-place `+=` wrote into the tensor stored in
            # `state` (for `real`) and into the storage shared with the un-detached generator output (for `fake`,
            # since detach() shares memory), corrupting them for every later consumer of `state`.
            # NOTE(review): the configured noise value only acts as an on/off switch here; the noise itself is
            # always unit-variance. Confirm whether it was meant to scale the noise.
            real[0] = real[0] + torch.randn_like(real[0])
            fake[0] = fake[0] + torch.randn_like(fake[0])
        d_real = net(*real)
        d_fake = net(*fake)

        self.metrics.append(("d_fake", torch.mean(d_fake)))
        self.metrics.append(("d_real", torch.mean(d_real)))

        gan_type = self.opt['gan_type']
        if gan_type in ['gan', 'pixgan']:
            l_real = self.criterion(d_real, True)
            l_fake = self.criterion(d_fake, False)
            return l_real + l_fake
        elif gan_type == 'ragan':
            return (self.criterion(d_real - torch.mean(d_fake), True) +
                    self.criterion(d_fake - torch.mean(d_real), False))
        else:
            raise NotImplementedError
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`import torch`
			`import torch.nn as nn`
			`from models.networks import define_F`
			`from models.loss import GANLoss`


			`def create_generator_loss(opt_loss, env):`
			`type = opt_loss['type']`
			`if type == 'pix':`
			`return PixLoss(opt_loss, env)`
			`elif type == 'feature':`
			`return FeatureLoss(opt_loss, env)`
Interpreted feature loss to extensibletrainer 2020-09-02 16:08:24 +00:00			`elif type == 'interpreted_feature':`
			`return InterpretedFeatureLoss(opt_loss, env)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`elif type == 'generator_gan':`
			`return GeneratorGanLoss(opt_loss, env)`
			`elif type == 'discriminator_gan':`
			`return DiscriminatorGanLoss(opt_loss, env)`
			`else:`
			`raise NotImplementedError`


Add new referencing discriminator Also extend the way losses work so that you can pass parameters into the discriminator from the config file 2020-09-11 03:35:29 +00:00			`# Converts params to a list of tensors extracted from state. Works with list/tuple params as well as scalars.`
			`def extract_params_from_state(params, state):`
			`if isinstance(params, list) or isinstance(params, tuple):`
			`p = [state[r] for r in params]`
			`else:`
			`p = [state[params]]`
			`return p`


ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`class ConfigurableLoss(nn.Module):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(ConfigurableLoss, self).__init__()`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.opt = opt`
			`self.env = env`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`self.metrics = []`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00
Supporting infrastructure in ExtensibleTrainer to train spsr4 Need to be able to train 2 nets in one step: the backbone will be entirely separate with its own optimizer (for an extremely low LR). This functionality was already present, just not implemented correctly. 2020-09-12 04:57:06 +00:00			`# net is either a scalar network being trained or a list of networks being trained, depending on the configuration.`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`def forward(self, net, state):`
			`raise NotImplementedError`

More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`def extra_metrics(self):`
			`return self.metrics`

ExtensibleTrainer work 2020-08-22 14:24:34 +00:00
			`def get_basic_criterion_for_name(name, device):`
			`if name == 'l1':`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`return nn.L1Loss().to(device)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`elif name == 'l2':`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`return nn.MSELoss().to(device)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`else:`
			`raise NotImplementedError`


			`class PixLoss(ConfigurableLoss):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(PixLoss, self).__init__(opt, env)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.opt = opt`
			`self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])`

Supporting infrastructure in ExtensibleTrainer to train spsr4 Need to be able to train 2 nets in one step: the backbone will be entirely separate with its own optimizer (for an extremely low LR). This functionality was already present, just not implemented correctly. 2020-09-12 04:57:06 +00:00			`def forward(self, _, state):`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`return self.criterion(state[self.opt['fake']], state[self.opt['real']])`


			`class FeatureLoss(ConfigurableLoss):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(FeatureLoss, self).__init__(opt, env)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.opt = opt`
			`self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])`
Interpreted feature loss to extensibletrainer 2020-09-02 16:08:24 +00:00			`self.netF = define_F(which_model=opt['which_model_F'],`
			`load_path=opt['load_path'] if 'load_path' in opt.keys() else None).to(self.env['device'])`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`if not env['opt']['dist']:`
			`self.netF = torch.nn.parallel.DataParallel(self.netF)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00
Supporting infrastructure in ExtensibleTrainer to train spsr4 Need to be able to train 2 nets in one step: the backbone will be entirely separate with its own optimizer (for an extremely low LR). This functionality was already present, just not implemented correctly. 2020-09-12 04:57:06 +00:00			`def forward(self, _, state):`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`with torch.no_grad():`
			`logits_real = self.netF(state[self.opt['real']])`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`logits_fake = self.netF(state[self.opt['fake']])`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`return self.criterion(logits_fake, logits_real)`


Interpreted feature loss to extensibletrainer 2020-09-02 16:08:24 +00:00			`# Special form of feature loss which first computes the feature embedding for the truth space, then uses a second`
			`# network which was trained to replicate that embedding on an altered input space (for example, LR or greyscale) to`
			`# compute the embedding in the generated space. Useful for weakening the influence of the feature network in controlled`
			`# ways.`
			`class InterpretedFeatureLoss(ConfigurableLoss):`
			`def __init__(self, opt, env):`
			`super(InterpretedFeatureLoss, self).__init__(opt, env)`
			`self.opt = opt`
			`self.criterion = get_basic_criterion_for_name(opt['criterion'], env['device'])`
			`self.netF_real = define_F(which_model=opt['which_model_F']).to(self.env['device'])`
			`self.netF_gen = define_F(which_model=opt['which_model_F'], load_path=opt['load_path']).to(self.env['device'])`
			`if not env['opt']['dist']:`
			`self.netF_real = torch.nn.parallel.DataParallel(self.netF_real)`
			`self.netF_gen = torch.nn.parallel.DataParallel(self.netF_gen)`

Supporting infrastructure in ExtensibleTrainer to train spsr4 Need to be able to train 2 nets in one step: the backbone will be entirely separate with its own optimizer (for an extremely low LR). This functionality was already present, just not implemented correctly. 2020-09-12 04:57:06 +00:00			`def forward(self, _, state):`
Add InterpolateInjector 2020-09-03 17:32:47 +00:00			`logits_real = self.netF_real(state[self.opt['real']])`
Interpreted feature loss to extensibletrainer 2020-09-02 16:08:24 +00:00			`logits_fake = self.netF_gen(state[self.opt['fake']])`
			`return self.criterion(logits_fake, logits_real)`


ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`class GeneratorGanLoss(ConfigurableLoss):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(GeneratorGanLoss, self).__init__(opt, env)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.opt = opt`
			`self.criterion = GANLoss(opt['gan_type'], 1.0, 0.0).to(env['device'])`

Supporting infrastructure in ExtensibleTrainer to train spsr4 Need to be able to train 2 nets in one step: the backbone will be entirely separate with its own optimizer (for an extremely low LR). This functionality was already present, just not implemented correctly. 2020-09-12 04:57:06 +00:00			`def forward(self, _, state):`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`netD = self.env['discriminators'][self.opt['discriminator']]`
Add new referencing discriminator Also extend the way losses work so that you can pass parameters into the discriminator from the config file 2020-09-11 03:35:29 +00:00			`fake = extract_params_from_state(self.opt['fake'], state)`
			`if self.opt['gan_type'] in ['gan', 'pixgan', 'pixgan_fea']:`
			`pred_g_fake = netD(*fake)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`return self.criterion(pred_g_fake, True)`
			`elif self.opt['gan_type'] == 'ragan':`
Add new referencing discriminator Also extend the way losses work so that you can pass parameters into the discriminator from the config file 2020-09-11 03:35:29 +00:00			`real = extract_params_from_state(self.opt['real'], state)`
			`real = [r.detach() for r in real]`
			`pred_d_real = netD(*real).detach()`
			`pred_g_fake = netD(*fake)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`return (self.cri_gan(pred_d_real - torch.mean(pred_g_fake), False) +`
			`self.cri_gan(pred_g_fake - torch.mean(pred_d_real), True)) / 2`
			`else:`
			`raise NotImplementedError`


			`class DiscriminatorGanLoss(ConfigurableLoss):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(DiscriminatorGanLoss, self).__init__(opt, env)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.opt = opt`
			`self.criterion = GANLoss(opt['gan_type'], 1.0, 0.0).to(env['device'])`
Allow discriminator noise to be injected at the loss level, cleans up configs 2020-09-20 03:47:52 +00:00			`self.noise = None if 'noise' not in opt.keys() else opt['noise']`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00
			`def forward(self, net, state):`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`self.metrics = []`
Add new referencing discriminator Also extend the way losses work so that you can pass parameters into the discriminator from the config file 2020-09-11 03:35:29 +00:00			`real = extract_params_from_state(self.opt['real'], state)`
			`fake = extract_params_from_state(self.opt['fake'], state)`
			`fake = [f.detach() for f in fake]`
Allow discriminator noise to be injected at the loss level, cleans up configs 2020-09-20 03:47:52 +00:00			`if self.noise:`
			`# An assumption is made that the first input to the discriminator is what we want to add noise to. If not,`
			`# use a explicit formulation of adding noise (using an injector)`
			`real[0] += torch.randn_like(real[0])`
			`fake[0] += torch.randn_like(fake[0])`
Add new referencing discriminator Also extend the way losses work so that you can pass parameters into the discriminator from the config file 2020-09-11 03:35:29 +00:00			`d_real = net(*real)`
			`d_fake = net(*fake)`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00
			`self.metrics.append(("d_fake", torch.mean(d_fake)))`
Misc fixes & adjustments 2020-09-01 13:58:11 +00:00			`self.metrics.append(("d_real", torch.mean(d_real)))`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00
Add new referencing discriminator Also extend the way losses work so that you can pass parameters into the discriminator from the config file 2020-09-11 03:35:29 +00:00			`if self.opt['gan_type'] in ['gan', 'pixgan']:`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`l_real = self.criterion(d_real, True)`
			`l_fake = self.criterion(d_fake, False)`
			`l_total = l_real + l_fake`
			`return l_total`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`elif self.opt['gan_type'] == 'ragan':`
Misc fixes & adjustments 2020-09-01 13:58:11 +00:00			`return (self.criterion(d_real - torch.mean(d_fake), True) +`
			`self.criterion(d_fake - torch.mean(d_real), False))`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`else:`
			`raise NotImplementedError`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00