DL-Art-School/codes/models/steps/injectors.py

import torch.nn
from models.archs.SPSR_arch import ImageGradientNoPadding
from data.weight_scheduler import get_scheduler_for_opt
from torch.utils.checkpoint import checkpoint
import torchvision.utils as utils
#from models.steps.recursive_gen_injectors import ImageFlowInjector

# Injectors are a way to synthesize data within a step that can then be used (and reused) by loss functions.
def create_injector(opt_inject, env):
    """Build the injector selected by ``opt_inject['type']``.

    Args:
        opt_inject: Mapping of injector options. The ``'type'`` entry selects the injector
            class; the whole mapping is forwarded unchanged to that class's constructor.
        env: Shared environment object, forwarded unchanged to the injector's constructor.

    Returns:
        A newly constructed injector instance.

    Raises:
        NotImplementedError: If ``opt_inject['type']`` does not name a known injector.
    """
    # Named `injector_type` rather than `type` so the builtin is not shadowed.
    injector_type = opt_inject['type']
    if injector_type == 'generator':
        return ImageGeneratorInjector(opt_inject, env)
    if injector_type == 'discriminator':
        return DiscriminatorInjector(opt_inject, env)
    if injector_type == 'scheduled_scalar':
        return ScheduledScalarInjector(opt_inject, env)
    if injector_type == 'img_grad':
        return ImageGradientInjector(opt_inject, env)
    if injector_type == 'add_noise':
        return AddNoiseInjector(opt_inject, env)
    if injector_type == 'greyscale':
        return GreyInjector(opt_inject, env)
    if injector_type == 'interpolate':
        return InterpolateInjector(opt_inject, env)
    if injector_type == 'imageflow':
        # The module-level import of ImageFlowInjector is commented out in this file, so the
        # name would otherwise be undefined here (NameError). Import it at call time instead.
        # NOTE(review): presumably the top-level import was disabled to avoid a circular
        # import with recursive_gen_injectors - confirm.
        from models.steps.recursive_gen_injectors import ImageFlowInjector
        return ImageFlowInjector(opt_inject, env)
    if injector_type == 'image_patch':
        return ImagePatchInjector(opt_inject, env)
    raise NotImplementedError('Unknown injector type: %r' % (injector_type,))


class Injector(torch.nn.Module):
    """Base class for injectors.

    Stores the options and environment it is constructed with. ``opt['out']`` is required and
    is kept as ``self.output``; ``opt['in']`` is optional and, only when present, is kept as
    ``self.input`` (otherwise the attribute is never set).
    """

    def __init__(self, opt, env):
        super().__init__()
        self.env = env
        self.opt = opt
        # 'out' is mandatory; a missing key raises KeyError here.
        self.output = opt['out']
        # 'in' is optional - some injectors produce a value without reading state.
        if 'in' in opt.keys():
            self.input = opt['in']

    def forward(self, state):
        """Return a dict of new state variables. Subclasses must override this."""
        raise NotImplementedError


# Uses a generator to synthesize an image from [in] and injects the results into [out]
# Note that results are *not* detached.
class ImageGeneratorInjector(Injector):
    """Runs a generator from ``env['generators']`` on state entries and injects its output.

    The generator is looked up by ``opt['generator']``. ``self.input`` may be a single state
    key or a list of keys (passed positionally). ``self.output`` may be a single key, or a
    list of keys that are matched index-by-index against a list/tuple result.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)

    def forward(self, state):
        generator = self.env['generators'][self.opt['generator']]

        source = self.input
        if isinstance(source, list):
            # Several inputs: feed them to the generator as positional arguments.
            outputs = generator(*[state[key] for key in source])
        else:
            outputs = generator(state[source])

        target = self.output
        if not isinstance(target, list):
            # Single output label: store whatever the generator returned as-is.
            return {target: outputs}

        # Only dereference tuples or lists, not tensors.
        assert isinstance(outputs, (list, tuple))
        return {key: outputs[idx] for idx, key in enumerate(target)}


# Injects a result from a discriminator network into the state.
class DiscriminatorInjector(Injector):
    """Runs a discriminator from ``env['discriminators']`` and injects its output into state.

    The discriminator is looked up by ``opt['discriminator']``. ``self.input`` is either one
    state key or a list of keys (passed positionally); ``self.output`` is either one key or a
    list of keys matched by index against a list/tuple result.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)

    def forward(self, state):
        disc = self.env['discriminators'][self.opt['discriminator']]

        if isinstance(self.input, list):
            # Multiple inputs are unpacked into positional arguments.
            args = [state[name] for name in self.input]
            verdict = disc(*args)
        else:
            verdict = disc(state[self.input])

        if isinstance(self.output, list):
            # Only dereference tuples or lists, not tensors.
            assert isinstance(verdict, (list, tuple))
            injected = {name: verdict[pos] for pos, name in enumerate(self.output)}
        else:
            injected = {self.output: verdict}
        return injected


# Creates an image gradient from [in] and injects it into [out]
class ImageGradientInjector(Injector):
    """Applies ``ImageGradientNoPadding`` to ``state[opt['in']]`` and injects it as ``opt['out']``."""

    def __init__(self, opt, env):
        super().__init__(opt, env)
        # The gradient module is created once and moved to the configured device.
        gradient_module = ImageGradientNoPadding()
        self.img_grad_fn = gradient_module.to(env['device'])

    def forward(self, state):
        out_key = self.opt['out']
        gradient = self.img_grad_fn(state[self.opt['in']])
        return {out_key: gradient}


# Injects a scalar that is modulated with a specified schedule. Useful for increasing or decreasing the influence
# of something over time.
class ScheduledScalarInjector(Injector):
    """Injects the scheduler's weight for the current step (``env['step']``) as ``opt['out']``.

    The scheduler is built once from ``opt['scheduler']`` via ``get_scheduler_for_opt``.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        scheduler_opt = opt['scheduler']
        self.scheduler = get_scheduler_for_opt(scheduler_opt)

    def forward(self, state):
        out_key = self.opt['out']
        # `state` is not read; the value depends only on the current step.
        weight = self.scheduler.get_weight_for_step(self.env['step'])
        return {out_key: weight}


# Adds gaussian noise (standard normal samples multiplied by [scale]) to [in] and injects the result into [out]
class AddNoiseInjector(Injector):
    """Adds standard-normal noise multiplied by a scale to ``state[opt['in']]``.

    ``opt['scale']`` is either a number used directly, or a string naming a state entry that
    holds the scale. The noise is created on ``env['device']``.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)

    def forward(self, state):
        # Scale can be a fixed float, or a state key (e.g. from ScheduledScalarInjector).
        scale_opt = self.opt['scale']
        scale = state[scale_opt] if isinstance(scale_opt, str) else scale_opt

        source = state[self.opt['in']]
        noise = scale * 1 if False else torch.randn_like(source, device=self.env['device']) * scale
        return {self.opt['out']: source + noise}


# Averages the channel dimension (1) of [in] and saves to [out]. The average is repeated 3 times along
# the channel dimension, so the output always has 3 channels.
class GreyInjector(Injector):
    """Injects the channel-wise mean of ``state[opt['in']]``, tiled to 3 channels, as ``opt['out']``."""

    def __init__(self, opt, env):
        super().__init__(opt, env)

    def forward(self, state):
        source = state[self.opt['in']]
        # Collapse dim 1 to a single averaged channel, then tile it 3 times along that dim.
        grey = torch.mean(source, dim=1, keepdim=True).repeat(1, 3, 1, 1)
        return {self.opt['out']: grey}


class InterpolateInjector(Injector):
    """Resizes ``state[opt['in']]`` with ``torch.nn.functional.interpolate`` into ``opt['out']``.

    Options read from ``opt``:
        scale_factor: Optional. When present (and not None) it is used and ``size`` is ignored.
        size: Used when ``scale_factor`` is not given. A single number is expanded to a square
            ``(size, size)``; a list/tuple is used as given.
        mode: Interpolation mode passed straight through to ``interpolate``.
    """

    def __init__(self, opt, env):
        super(InterpolateInjector, self).__init__(opt, env)
        # interpolate() accepts only one of scale_factor/size, so resolve that choice once here.
        if 'scale_factor' in opt.keys() and opt['scale_factor'] is not None:
            self.scale_factor = opt['scale_factor']
            self.size = None
        else:
            self.scale_factor = None
            size = opt['size']
            self.size = tuple(size) if isinstance(size, (list, tuple)) else (size, size)

    def forward(self, state):
        # Use the values resolved in __init__ rather than re-reading opt: reading
        # opt['scale_factor'] / opt['size'] directly raises KeyError on a plain dict when one of
        # them is absent, and passes both to interpolate() when both are configured.
        scaled = torch.nn.functional.interpolate(state[self.opt['in']], scale_factor=self.scale_factor,
                                                 size=self.size, mode=self.opt['mode'])
        return {self.opt['out']: scaled}


# Extracts four patches from the input image, each a square of 'patch_size'. The patches are taken from each
# of the four corners of the image. The intent of this injector is that each patch shares some part of the input,
# which can then be used in the translation invariance loss.
#
# This injector is unique in that it does not only produce the specified output label into state. Instead it produces five
# outputs for the specified label, one for each corner of the input as well as the specified output, which is the top left
# corner. See the code below to find out how this works.
#
# Another note: this injector operates differently in eval mode (e.g. when env['training']=False) - in this case, it
# simply sets all the output state variables to the input. This is so that you can feed the output of this injector
# directly into your generator in training without affecting test performance.
class ImagePatchInjector(Injector):
    """Injects square corner patches of ``state[opt['in']]`` under five state keys.

    Keys written: ``opt['out']`` plus ``<out>_top_left``, ``<out>_top_right``,
    ``<out>_bottom_left`` and ``<out>_bottom_right``. When ``env['training']`` is truthy each
    corner key holds a ``patch_size`` square from that corner, and ``opt['out']`` holds the
    top-left square restricted to the first 3 channels. Otherwise every key holds the
    unmodified input.
    """

    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.patch_size = opt['patch_size']

    def forward(self, state):
        image = state[self.opt['in']]
        training = self.env['training']

        label = self.opt['out']
        top_left_key = '%s_top_left' % (label,)
        top_right_key = '%s_top_right' % (label,)
        bottom_left_key = '%s_bottom_left' % (label,)
        bottom_right_key = '%s_bottom_right' % (label,)

        if not training:
            # Eval mode: pass the full image through under every label.
            all_keys = (label, top_left_key, top_right_key, bottom_left_key, bottom_right_key)
            return {key: image for key in all_keys}

        # Leading/trailing `patch_size` elements along a spatial dimension.
        head = slice(None, self.patch_size)
        tail = slice(-self.patch_size, None)
        return {
            # The primary output is the top-left patch limited to the first 3 channels.
            label: image[:, :3, head, head],
            top_left_key: image[:, :, head, head],
            top_right_key: image[:, :, head, tail],
            bottom_left_key: image[:, :, tail, head],
            bottom_right_key: image[:, :, tail, tail],
        }
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`import torch.nn`
			`from models.archs.SPSR_arch import ImageGradientNoPadding`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`from data.weight_scheduler import get_scheduler_for_opt`
Add geometric loss 2020-09-20 22:24:23 +00:00			`from torch.utils.checkpoint import checkpoint`
Add ImagePatchInjector and TranslationalLoss 2020-09-27 03:25:32 +00:00			`import torchvision.utils as utils`
Add geometric loss 2020-09-20 22:24:23 +00:00			`#from models.steps.recursive_gen_injectors import ImageFlowInjector`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00
			`# Injectors are a way to sythesize data within a step that can then be used (and reused) by loss functions.`
			`def create_injector(opt_inject, env):`
			`type = opt_inject['type']`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`if type == 'generator':`
			`return ImageGeneratorInjector(opt_inject, env)`
Add a new script for loading a discriminator network and using it to filter images 2020-09-17 19:30:32 +00:00			`elif type == 'discriminator':`
			`return DiscriminatorInjector(opt_inject, env)`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`elif type == 'scheduled_scalar':`
			`return ScheduledScalarInjector(opt_inject, env)`
			`elif type == 'img_grad':`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`return ImageGradientInjector(opt_inject, env)`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`elif type == 'add_noise':`
			`return AddNoiseInjector(opt_inject, env)`
			`elif type == 'greyscale':`
			`return GreyInjector(opt_inject, env)`
Add InterpolateInjector 2020-09-03 17:32:47 +00:00			`elif type == 'interpolate':`
			`return InterpolateInjector(opt_inject, env)`
Add ImageFlowInjector 2020-09-19 16:07:00 +00:00			`elif type == 'imageflow':`
			`return ImageFlowInjector(opt_inject, env)`
Add ImagePatchInjector and TranslationalLoss 2020-09-27 03:25:32 +00:00			`elif type == 'image_patch':`
			`return ImagePatchInjector(opt_inject, env)`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`else:`
			`raise NotImplementedError`


			`class Injector(torch.nn.Module):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(Injector, self).__init__()`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.opt = opt`
			`self.env = env`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`if 'in' in opt.keys():`
			`self.input = opt['in']`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`self.output = opt['out']`

			`# This should return a dict of new state variables.`
			`def forward(self, state):`
			`raise NotImplementedError`


More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`# Uses a generator to synthesize an image from [in] and injects the results into [out]`
			`# Note that results are not detached.`
			`class ImageGeneratorInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(ImageGeneratorInjector, self).__init__(opt, env)`

			`def forward(self, state):`
			`gen = self.env['generators'][self.opt['generator']]`
Reference network 2020-08-25 17:56:59 +00:00			`if isinstance(self.input, list):`
			`params = [state[i] for i in self.input]`
			`results = gen(*params)`
			`else:`
			`results = gen(state[self.input])`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`new_state = {}`
			`if isinstance(self.output, list):`
Supporting infrastructure in ExtensibleTrainer to train spsr4 Need to be able to train 2 nets in one step: the backbone will be entirely separate with its own optimizer (for an extremely low LR). This functionality was already present, just not implemented correctly. 2020-09-12 04:57:06 +00:00			`# Only dereference tuples or lists, not tensors.`
			`assert isinstance(results, list) or isinstance(results, tuple)`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`for i, k in enumerate(self.output):`
			`new_state[k] = results[i]`
			`else:`
			`new_state[self.output] = results`

			`return new_state`


Add a new script for loading a discriminator network and using it to filter images 2020-09-17 19:30:32 +00:00			`# Injects a result from a discriminator network into the state.`
			`class DiscriminatorInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(DiscriminatorInjector, self).__init__(opt, env)`

			`def forward(self, state):`
			`d = self.env['discriminators'][self.opt['discriminator']]`
			`if isinstance(self.input, list):`
			`params = [state[i] for i in self.input]`
			`results = d(*params)`
			`else:`
			`results = d(state[self.input])`
			`new_state = {}`
			`if isinstance(self.output, list):`
			`# Only dereference tuples or lists, not tensors.`
			`assert isinstance(results, list) or isinstance(results, tuple)`
			`for i, k in enumerate(self.output):`
			`new_state[k] = results[i]`
			`else:`
			`new_state[self.output] = results`

			`return new_state`


More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`# Creates an image gradient from [in] and injects it into [out]`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`class ImageGradientInjector(Injector):`
			`def __init__(self, opt, env):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`super(ImageGradientInjector, self).__init__(opt, env)`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`self.img_grad_fn = ImageGradientNoPadding().to(env['device'])`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00
			`def forward(self, state):`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`return {self.opt['out']: self.img_grad_fn(state[self.opt['in']])}`


More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`# Injects a scalar that is modulated with a specified schedule. Useful for increasing or decreasing the influence`
			`# of something over time.`
			`class ScheduledScalarInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(ScheduledScalarInjector, self).__init__(opt, env)`
			`self.scheduler = get_scheduler_for_opt(opt['scheduler'])`

			`def forward(self, state):`
			`return {self.opt['out']: self.scheduler.get_weight_for_step(self.env['step'])}`


More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`# Adds gaussian noise to [in], scales it to [0,[scale]] and injects into [out]`
			`class AddNoiseInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(AddNoiseInjector, self).__init__(opt, env)`

			`def forward(self, state):`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`# Scale can be a fixed float, or a state key (e.g. from ScheduledScalarInjector).`
			`if isinstance(self.opt['scale'], str):`
			`scale = state[self.opt['scale']]`
			`else:`
			`scale = self.opt['scale']`

			`noise = torch.randn_like(state[self.opt['in']], device=self.env['device']) * scale`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`return {self.opt['out']: state[self.opt['in']] + noise}`


			`# Averages the channel dimension (1) of [in] and saves to [out]. Dimensions are`
			`# kept the same, the average is simply repeated.`
			`class GreyInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(GreyInjector, self).__init__(opt, env)`

			`def forward(self, state):`
			`mean = torch.mean(state[self.opt['in']], dim=1, keepdim=True)`
Add InterpolateInjector 2020-09-03 17:32:47 +00:00			`mean = mean.repeat(1, 3, 1, 1)`
More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`return {self.opt['out']: mean}`
Add InterpolateInjector 2020-09-03 17:32:47 +00:00
Add ImagePatchInjector and TranslationalLoss 2020-09-27 03:25:32 +00:00
Add InterpolateInjector 2020-09-03 17:32:47 +00:00			`class InterpolateInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(InterpolateInjector, self).__init__(opt, env)`
Fix up translational equivariance loss so it's ready for prime time 2020-09-30 18:01:00 +00:00			`if 'scale_factor' in opt.keys():`
			`self.scale_factor = opt['scale_factor']`
			`self.size = None`
			`else:`
			`self.scale_factor = None`
			`self.size = (opt['size'], opt['size'])`
Add InterpolateInjector 2020-09-03 17:32:47 +00:00
			`def forward(self, state):`
			`scaled = torch.nn.functional.interpolate(state[self.opt['in']], scale_factor=self.opt['scale_factor'],`
Fix up translational equivariance loss so it's ready for prime time 2020-09-30 18:01:00 +00:00			`size=self.opt['size'], mode=self.opt['mode'])`
Add ImageFlowInjector 2020-09-19 16:07:00 +00:00			`return {self.opt['out']: scaled}`
Add ImagePatchInjector and TranslationalLoss 2020-09-27 03:25:32 +00:00

			`# Extracts four patches from the input image, each a square of 'patch_size'. The input images are taken from each`
			`# of the four corners of the image. The intent of this loss is that each patch shares some part of the input, which`
			`# can then be used in the translation invariance loss.`
			`#`
			`# This injector is unique in that it does not only produce the specified output label into state. Instead it produces five`
			`# outputs for the specified label, one for each corner of the input as well as the specified output, which is the top left`
			`# corner. See the code below to find out how this works.`
			`#`
			`# Another note: this injector operates differently in eval mode (e.g. when env['training']=False) - in this case, it`
			`# simply sets all the output state variables to the input. This is so that you can feed the output of this injector`
			`# directly into your generator in training without affecting test performance.`
			`class ImagePatchInjector(Injector):`
			`def __init__(self, opt, env):`
			`super(ImagePatchInjector, self).__init__(opt, env)`
			`self.patch_size = opt['patch_size']`

			`def forward(self, state):`
			`im = state[self.opt['in']]`
			`if self.env['training']:`
Fix up translational equivariance loss so it's ready for prime time 2020-09-30 18:01:00 +00:00			`return { self.opt['out']: im[:, :3, :self.patch_size, :self.patch_size],`
			`'%s_top_left' % (self.opt['out'],): im[:, :, :self.patch_size, :self.patch_size],`
			`'%s_top_right' % (self.opt['out'],): im[:, :, :self.patch_size, -self.patch_size:],`
			`'%s_bottom_left' % (self.opt['out'],): im[:, :, -self.patch_size:, :self.patch_size],`
			`'%s_bottom_right' % (self.opt['out'],): im[:, :, -self.patch_size:, -self.patch_size:] }`
Add ImagePatchInjector and TranslationalLoss 2020-09-27 03:25:32 +00:00			`else:`
			`return { self.opt['out']: im,`
			`'%s_top_left' % (self.opt['out'],): im,`
			`'%s_top_right' % (self.opt['out'],): im,`
			`'%s_bottom_left' % (self.opt['out'],): im,`
			`'%s_bottom_right' % (self.opt['out'],): im }`