DL-Art-School/codes/models/networks.py

import torch
import logging
from munch import munchify
import models.archs.SRResNet_arch as SRResNet_arch
import models.archs.discriminator_vgg_arch as SRGAN_arch
import models.archs.DiscriminatorResnet_arch as DiscriminatorResnet_arch
import models.archs.DiscriminatorResnet_arch_passthrough as DiscriminatorResnet_arch_passthrough
import models.archs.RRDBNet_arch as RRDBNet_arch
import models.archs.feature_arch as feature_arch
import models.archs.SwitchedResidualGenerator_arch as SwitchedGen_arch
import models.archs.SPSR_arch as spsr
from collections import OrderedDict

logger = logging.getLogger('base')

# Generator
def define_G(opt, net_key='network_G', scale=None):
    """Build the generator network selected by ``which_model_G``.

    Args:
        opt: Options mapping. When ``net_key`` is not None the generator options are read
            from ``opt[net_key]``; otherwise ``opt`` itself is used as the generator options.
        net_key: Key of the generator options inside ``opt``, or None to use ``opt`` directly.
        scale: Upscale factor. When None it is read from ``opt['scale']``. Only the
            'RRDBNet' and 'ConfigurableSwitchedResidualGenerator2' branches consume this
            value; the other architectures read ``opt_net['scale']`` themselves.

    Returns:
        The constructed generator.

    Raises:
        NotImplementedError: If ``which_model_G`` does not name a known generator.
    """
    opt_net = opt[net_key] if net_key is not None else opt
    if scale is None:
        scale = opt['scale']
    which_model = opt_net['which_model_G']

    # image restoration
    if which_model == 'MSRResNet':
        netG = SRResNet_arch.MSRResNet(in_nc=opt_net['in_nc'], out_nc=opt_net['out_nc'],
                                       nf=opt_net['nf'], nb=opt_net['nb'], upscale=opt_net['scale'])
    elif which_model == 'RRDBNet':
        # An optional initial stride (1 or 2) may be configured; it defaults to 1.
        initial_stride = opt_net.get('initial_stride', 1)
        assert initial_stride == 1 or initial_stride == 2
        # Need to adjust the scale the generator sees by the stride since the stride causes a down-sample.
        gen_scale = scale * initial_stride
        netG = RRDBNet_arch.RRDBNet(in_nc=opt_net['in_nc'], out_nc=opt_net['out_nc'],
                                    nf=opt_net['nf'], nb=opt_net['nb'], scale=gen_scale, initial_stride=initial_stride)
    elif which_model == "ConfigurableSwitchedResidualGenerator2":
        netG = SwitchedGen_arch.ConfigurableSwitchedResidualGenerator2(switch_depth=opt_net['switch_depth'], switch_filters=opt_net['switch_filters'],
                                                                      switch_reductions=opt_net['switch_reductions'],
                                                                      switch_processing_layers=opt_net['switch_processing_layers'], trans_counts=opt_net['trans_counts'],
                                                                      trans_kernel_sizes=opt_net['trans_kernel_sizes'], trans_layers=opt_net['trans_layers'],
                                                                      transformation_filters=opt_net['transformation_filters'], attention_norm=opt_net['attention_norm'],
                                                                      initial_temp=opt_net['temperature'], final_temperature_step=opt_net['temperature_final_step'],
                                                                      heightened_temp_min=opt_net['heightened_temp_min'], heightened_final_step=opt_net['heightened_final_step'],
                                                                      upsample_factor=scale, add_scalable_noise_to_transforms=opt_net['add_noise'])
    elif which_model == 'spsr_net_improved':
        netG = spsr.SPSRNetSimplified(in_nc=opt_net['in_nc'], out_nc=opt_net['out_nc'], nf=opt_net['nf'],
                                      nb=opt_net['nb'], upscale=opt_net['scale'])
    elif which_model == "spsr_switched":
        # 'num_transforms' and 'temperature' are optional and default to 8 and 10.
        xforms = opt_net.get('num_transforms', 8)
        netG = spsr.SwitchedSpsr(in_nc=3, out_nc=3, nf=opt_net['nf'], xforms=xforms, upscale=opt_net['scale'],
                                 init_temperature=opt_net.get('temperature', 10))
    elif which_model == "spsr_switched_with_ref":
        xforms = opt_net.get('num_transforms', 8)
        netG = spsr.SwitchedSpsrWithRef(in_nc=3, out_nc=3, nf=opt_net['nf'], xforms=xforms, upscale=opt_net['scale'],
                                        init_temperature=opt_net.get('temperature', 10))
    elif which_model == "spsr_switched_with_ref2":
        xforms = opt_net.get('num_transforms', 8)
        netG = spsr.SwitchedSpsrWithRef2(in_nc=3, out_nc=3, nf=opt_net['nf'], xforms=xforms, upscale=opt_net['scale'],
                                         init_temperature=opt_net.get('temperature', 10))
    else:
        # '{}' rather than '{:s}': the latter raises a formatting error for non-string values
        # (e.g. None or an int), masking the intended NotImplementedError.
        raise NotImplementedError('Generator model [{}] not recognized'.format(which_model))

    return netG


class GradDiscWrapper(torch.nn.Module):
    """Pass-through module that holds a discriminator as ``self.m``.

    Construction logs an informational message; ``forward`` delegates directly to the
    wrapped module.
    """

    def __init__(self, m):
        super().__init__()
        logger.info("Wrapping a discriminator..")
        # Keep the attribute name 'm': it is part of the module's parameter naming.
        self.m = m

    def forward(self, x):
        """Return whatever the wrapped module produces for ``x``."""
        wrapped = self.m
        return wrapped(x)

def define_D_net(opt_net, img_sz=None, wrap=False):
    """Build the discriminator network selected by ``opt_net['which_model_D']``.

    Args:
        opt_net: Discriminator options mapping; must contain 'which_model_D' plus the keys
            the chosen architecture reads.
        img_sz: Input image size. The 'discriminator_vgg_128' and 'discriminator_vgg_128_gn'
            branches divide it by 128, so it must be a number for those models; the resnet
            branches forward it as ``input_img_size``. Other branches ignore it.
        wrap: When True, a 'discriminator_vgg_128_gn' network is wrapped in
            ``GradDiscWrapper``. It has no effect on the other architectures.

    Returns:
        The constructed discriminator.

    Raises:
        NotImplementedError: If ``which_model_D`` does not name a known discriminator.
    """
    which_model = opt_net['which_model_D']

    if which_model == 'discriminator_vgg_128':
        netD = SRGAN_arch.Discriminator_VGG_128(in_nc=opt_net['in_nc'], nf=opt_net['nf'], input_img_factor=img_sz / 128, extra_conv=opt_net['extra_conv'])
    elif which_model == 'discriminator_vgg_128_gn':
        netD = SRGAN_arch.Discriminator_VGG_128_GN(in_nc=opt_net['in_nc'], nf=opt_net['nf'], input_img_factor=img_sz / 128)
        if wrap:
            netD = GradDiscWrapper(netD)
    elif which_model == 'discriminator_resnet':
        netD = DiscriminatorResnet_arch.fixup_resnet34(num_filters=opt_net['nf'], num_classes=1, input_img_size=img_sz)
    elif which_model == 'discriminator_resnet_passthrough':
        netD = DiscriminatorResnet_arch_passthrough.fixup_resnet34(num_filters=opt_net['nf'], num_classes=1, input_img_size=img_sz,
                                                                   number_skips=opt_net['number_skips'], use_bn=True,
                                                                   disable_passthrough=opt_net['disable_passthrough'])
    elif which_model == 'discriminator_pix':
        netD = SRGAN_arch.Discriminator_VGG_PixLoss(in_nc=opt_net['in_nc'], nf=opt_net['nf'])
    elif which_model == "discriminator_unet":
        netD = SRGAN_arch.Discriminator_UNet(in_nc=opt_net['in_nc'], nf=opt_net['nf'])
    elif which_model == "discriminator_unet_fea":
        netD = SRGAN_arch.Discriminator_UNet_FeaOut(in_nc=opt_net['in_nc'], nf=opt_net['nf'], feature_mode=opt_net['feature_mode'])
    elif which_model == "discriminator_switched":
        netD = SRGAN_arch.Discriminator_switched(in_nc=opt_net['in_nc'], nf=opt_net['nf'], initial_temp=opt_net['initial_temp'],
                                                 final_temperature_step=opt_net['final_temperature_step'])
    elif which_model == "cross_compare_vgg128":
        # 'ref_channels' is optional and defaults to 3.
        netD = SRGAN_arch.CrossCompareDiscriminator(in_nc=opt_net['in_nc'], ref_channels=opt_net.get('ref_channels', 3), nf=opt_net['nf'], scale=opt_net['scale'])
    else:
        # '{}' rather than '{:s}': the latter raises a formatting error for non-string values
        # (e.g. None or an int), masking the intended NotImplementedError.
        raise NotImplementedError('Discriminator model [{}] not recognized'.format(which_model))
    return netD

# Discriminator
def define_D(opt, wrap=False):
    """Build the discriminator described by the full options mapping ``opt``.

    The image size is taken from ``opt['datasets']['train']['target_size']`` and the
    network options from ``opt['network_D']``; both are handed to ``define_D_net``
    together with ``wrap``.
    """
    train_opts = opt['datasets']['train']
    target_size = train_opts['target_size']
    return define_D_net(opt['network_D'], target_size, wrap=wrap)

def define_fixed_D(opt):
    """Build a discriminator, load pretrained weights into it and freeze it.

    Args:
        opt: Discriminator options mapping. Besides the keys ``define_D_net`` reads, it must
            provide 'pretrained_path' (checkpoint file to load) and 'weight' (stored on the
            returned network as ``fdisc_weight``).

    Returns:
        The discriminator in eval mode with every parameter's ``requires_grad`` disabled.
    """
    # Note that this will not work with "old" VGG-style discriminators with dense blocks until the img_size parameter is added.
    net = define_D_net(opt)

    # Load the model parameters. map_location='cpu' lets checkpoints saved on a GPU load on
    # hosts without that device; load_state_dict copies the values into the network's own
    # tensors, so the resulting network is unaffected.
    # NOTE: torch.load unpickles the file - only point 'pretrained_path' at trusted checkpoints.
    load_net = torch.load(opt['pretrained_path'], map_location='cpu')
    # Remove the unnecessary 'module.' prefix from parameter names.
    load_net_clean = OrderedDict(
        (k[7:] if k.startswith('module.') else k, v) for k, v in load_net.items())
    net.load_state_dict(load_net_clean)

    # Put into eval mode, freeze the parameters and set the 'weight' field.
    net.eval()
    for param in net.parameters():
        param.requires_grad = False
    net.fdisc_weight = opt['weight']

    return net


# Define network used for perceptual loss
def define_F(which_model='vgg', use_bn=False, for_training=False, load_path=None):
    """Build the feature-extraction network used for perceptual loss.

    Args:
        which_model: 'vgg' or 'wide_resnet'.
        use_bn: For 'vgg', selects feature layer 49 (True) or 34 (False) and is forwarded
            to the extractor.
        for_training: For 'vgg', builds the trainable extractor variant. When False, the
            returned network is put in eval mode and its parameters are frozen.
        load_path: Optional checkpoint path whose parameters are loaded into the network.

    Returns:
        The constructed feature network.

    Raises:
        NotImplementedError: If ``which_model`` is not a supported feature network.
    """
    if which_model == 'vgg':
        # PyTorch pretrained VGG19-54, before ReLU.
        feature_layer = 49 if use_bn else 34
        if for_training:
            netF = feature_arch.TrainableVGGFeatureExtractor(feature_layer=feature_layer, use_bn=use_bn,
                                                             use_input_norm=True)
        else:
            netF = feature_arch.VGGFeatureExtractor(feature_layer=feature_layer, use_bn=use_bn,
                                                    use_input_norm=True)
    elif which_model == 'wide_resnet':
        netF = feature_arch.WideResnetFeatureExtractor(use_input_norm=True)
    else:
        raise NotImplementedError('Feature model [{}] not recognized'.format(which_model))

    if load_path:
        # Load the model parameters. map_location='cpu' lets checkpoints saved on a GPU load
        # on hosts without that device; load_state_dict copies the values into the network's
        # own tensors, so the resulting network is unaffected.
        # NOTE: torch.load unpickles the file - only load checkpoints from trusted sources.
        load_net = torch.load(load_path, map_location='cpu')
        # Remove the unnecessary 'module.' prefix from parameter names.
        load_net_clean = OrderedDict(
            (k[7:] if k.startswith('module.') else k, v) for k, v in load_net.items())
        netF.load_state_dict(load_net_clean)

    if not for_training:
        # Put into eval mode and freeze the parameters.
        netF.eval()
        for param in netF.parameters():
            param.requires_grad = False

    return netF
mmsr 2019-08-23 13:42:47 +00:00			`import torch`
Wrap vgg disc 2020-08-26 00:14:45 +00:00			`import logging`
Add updated spsr net for test 2020-09-07 23:01:48 +00:00			`from munch import munchify`
mmsr 2019-08-23 13:42:47 +00:00			`import models.archs.SRResNet_arch as SRResNet_arch`
			`import models.archs.discriminator_vgg_arch as SRGAN_arch`
Discriminator part 1 New discriminator. Includes spectral norming. 2020-04-29 05:00:29 +00:00			`import models.archs.DiscriminatorResnet_arch as DiscriminatorResnet_arch`
Add support for passthrough disc/gen Add RRDBNetXL, which performs processing at multiple image sizes. Add DiscResnet_passthrough, which allows passthrough of image at different sizes for discrimination. Adjust the rest of the repo to allow generators that return more than just a single image. 2020-05-04 20:01:43 +00:00			`import models.archs.DiscriminatorResnet_arch_passthrough as DiscriminatorResnet_arch_passthrough`
mmsr 2019-08-23 13:42:47 +00:00			`import models.archs.RRDBNet_arch as RRDBNet_arch`
Separate feature extractors out, add resnet feature extractor 2020-05-29 02:26:30 +00:00			`import models.archs.feature_arch as feature_arch`
New arch: SwitchedResidualGenerator_arch The concept here is to use switching to split the generator into two functions: interpretation and transformation. Transformation is done at the pixel level by relatively simple conv layers, while interpretation is computed at various levels by far more complicated conv stacks. The two are merged using the switching mechanism. This architecture is far less computationally intensive that RRDB. 2020-06-16 17:23:50 +00:00			`import models.archs.SwitchedResidualGenerator_arch as SwitchedGen_arch`
Integrate SPSR into SRGAN_model SPSR_model really isn't that different from SRGAN_model. Rather than continuing to re-implement everything I've done in SRGAN_model, port the new stuff from SPSR over. This really demonstrates the need to refactor SRGAN_model a bit to make it cleaner. It is quite the beast these days.. 2020-08-02 18:55:08 +00:00			`import models.archs.SPSR_arch as spsr`
Add capability to have old discriminators serve as feature networks 2020-07-31 20:59:54 +00:00			`from collections import OrderedDict`
mmsr 2019-08-23 13:42:47 +00:00
Wrap vgg disc 2020-08-26 00:14:45 +00:00			`logger = logging.getLogger('base')`

mmsr 2019-08-23 13:42:47 +00:00			`# Generator`
ExtensibleTrainer work 2020-08-22 14:24:34 +00:00			`def define_G(opt, net_key='network_G', scale=None):`
			`if net_key is not None:`
			`opt_net = opt[net_key]`
			`else:`
			`opt_net = opt`
			`if scale is None:`
			`scale = opt['scale']`
mmsr 2019-08-23 13:42:47 +00:00			`which_model = opt_net['which_model_G']`

			`# image restoration`
			`if which_model == 'MSRResNet':`
			`netG = SRResNet_arch.MSRResNet(in_nc=opt_net['in_nc'], out_nc=opt_net['out_nc'],`
			`nf=opt_net['nf'], nb=opt_net['nb'], upscale=opt_net['scale'])`
			`elif which_model == 'RRDBNet':`
Change GT_size to target_size 2020-04-22 06:37:41 +00:00			`# RRDB does scaling in two steps, so take the sqrt of the scale we actually want to achieve and feed it to RRDB.`
Add RRDB Initial Stride Allows downsampling immediately before processing, which reduces network complexity on higher resolution images but keeps a higher filter count. 2020-06-02 16:47:15 +00:00			`initial_stride = 1 if 'initial_stride' not in opt_net else opt_net['initial_stride']`
			`assert initial_stride == 1 or initial_stride == 2`
			`# Need to adjust the scale the generator sees by the stride since the stride causes a down-sample.`
			`gen_scale = scale * initial_stride`
mmsr 2019-08-23 13:42:47 +00:00			`netG = RRDBNet_arch.RRDBNet(in_nc=opt_net['in_nc'], out_nc=opt_net['out_nc'],`
Fix rrdb bug 2020-06-02 17:15:55 +00:00			`nf=opt_net['nf'], nb=opt_net['nb'], scale=gen_scale, initial_stride=initial_stride)`
Add ConfigurableSwitchComputer 2020-06-25 01:49:37 +00:00			`elif which_model == "ConfigurableSwitchedResidualGenerator2":`
SRG2 revival Big update to SRG2 architecture to pull in a lot of things that have been learned: - Use group norm instead of batch norm - Initialize the weights on the transformations low like is done in RRDB rather than using the scalar. Models live or die by their early stages, and this ones early stage is pretty weak - Transform multiplexer to use u-net like architecture. - Just use one set of configuration variables instead of a list - flat networks performed fine in this regard. 2020-07-09 23:34:51 +00:00			`netG = SwitchedGen_arch.ConfigurableSwitchedResidualGenerator2(switch_depth=opt_net['switch_depth'], switch_filters=opt_net['switch_filters'],`
Add ConfigurableSwitchComputer 2020-06-25 01:49:37 +00:00			`switch_reductions=opt_net['switch_reductions'],`
			`switch_processing_layers=opt_net['switch_processing_layers'], trans_counts=opt_net['trans_counts'],`
			`trans_kernel_sizes=opt_net['trans_kernel_sizes'], trans_layers=opt_net['trans_layers'],`
Make attention norm optional 2020-07-18 13:24:02 +00:00			`transformation_filters=opt_net['transformation_filters'], attention_norm=opt_net['attention_norm'],`
Add ConfigurableSwitchComputer 2020-06-25 01:49:37 +00:00			`initial_temp=opt_net['temperature'], final_temperature_step=opt_net['temperature_final_step'],`
Add NestedSwitchGenerator An evolution of SwitchedResidualGenerator, this variant nests attention modules upon themselves to extend the representative capacity of the model significantly. 2020-06-29 03:21:57 +00:00			`heightened_temp_min=opt_net['heightened_temp_min'], heightened_final_step=opt_net['heightened_final_step'],`
Add SpineNet & integrate with SRG New version of SRG uses SpineNet for a switch backbone. 2020-07-03 18:07:31 +00:00			`upsample_factor=scale, add_scalable_noise_to_transforms=opt_net['add_noise'])`
Add simplified SPSR architecture Basically just cleaning up the code, removing some bad conventions, and reducing complexity somewhat so that I can play around with this arch a bit more easily. 2020-08-03 16:25:37 +00:00			`elif which_model == 'spsr_net_improved':`
			`netG = spsr.SPSRNetSimplified(in_nc=opt_net['in_nc'], out_nc=opt_net['out_nc'], nf=opt_net['nf'],`
			`nb=opt_net['nb'], upscale=opt_net['scale'])`
Finish up spsr_switched 2020-08-08 03:03:48 +00:00			`elif which_model == "spsr_switched":`
Let SwitchedSpsr transform count be specified 2020-08-18 15:10:25 +00:00			`xforms = opt_net['num_transforms'] if 'num_transforms' in opt_net.keys() else 8`
Allow initial temperature to be specified to SPSR net for inference 2020-08-20 17:57:34 +00:00			`netG = spsr.SwitchedSpsr(in_nc=3, out_nc=3, nf=opt_net['nf'], xforms=xforms, upscale=opt_net['scale'],`
			`init_temperature=opt_net['temperature'] if 'temperature' in opt_net.keys() else 10)`
Reference network 2020-08-25 17:56:59 +00:00			`elif which_model == "spsr_switched_with_ref":`
			`xforms = opt_net['num_transforms'] if 'num_transforms' in opt_net.keys() else 8`
			`netG = spsr.SwitchedSpsrWithRef(in_nc=3, out_nc=3, nf=opt_net['nf'], xforms=xforms, upscale=opt_net['scale'],`
			`init_temperature=opt_net['temperature'] if 'temperature' in opt_net.keys() else 10)`
Add updated spsr net for test 2020-09-07 23:01:48 +00:00			`elif which_model == "spsr_switched_with_ref2":`
4x spsr ref (not workin) 2020-08-29 15:27:18 +00:00			`xforms = opt_net['num_transforms'] if 'num_transforms' in opt_net.keys() else 8`
Add updated spsr net for test 2020-09-07 23:01:48 +00:00			`netG = spsr.SwitchedSpsrWithRef2(in_nc=3, out_nc=3, nf=opt_net['nf'], xforms=xforms, upscale=opt_net['scale'],`
4x spsr ref (not workin) 2020-08-29 15:27:18 +00:00			`init_temperature=opt_net['temperature'] if 'temperature' in opt_net.keys() else 10)`
mmsr 2019-08-23 13:42:47 +00:00			`else:`
			`raise NotImplementedError('Generator model [{:s}] not recognized'.format(which_model))`

			`return netG`


wrap disc grad 2020-08-25 23:58:20 +00:00			`class GradDiscWrapper(torch.nn.Module):`
			`def __init__(self, m):`
			`super(GradDiscWrapper, self).__init__()`
Wrap vgg disc 2020-08-26 00:14:45 +00:00			`logger.info("Wrapping a discriminator..")`
wrap disc grad 2020-08-25 23:58:20 +00:00			`self.m = m`

Wrap vgg disc 2020-08-26 00:14:45 +00:00			`def forward(self, x):`
			`return self.m(x)`
wrap disc grad 2020-08-25 23:58:20 +00:00
			`def define_D_net(opt_net, img_sz=None, wrap=False):`
mmsr 2019-08-23 13:42:47 +00:00			`which_model = opt_net['which_model_D']`

			`if which_model == 'discriminator_vgg_128':`
Fix vgg_gn input_img_factor 2020-08-31 15:50:30 +00:00			`netD = SRGAN_arch.Discriminator_VGG_128(in_nc=opt_net['in_nc'], nf=opt_net['nf'], input_img_factor=img_sz / 128, extra_conv=opt_net['extra_conv'])`
Integrate SPSR into SRGAN_model SPSR_model really isn't that different from SRGAN_model. Rather than continuing to re-implement everything I've done in SRGAN_model, port the new stuff from SPSR over. This really demonstrates the need to refactor SRGAN_model a bit to make it cleaner. It is quite the beast these days.. 2020-08-02 18:55:08 +00:00			`elif which_model == 'discriminator_vgg_128_gn':`
Fix vgg_gn input_img_factor 2020-08-31 15:50:30 +00:00			`netD = SRGAN_arch.Discriminator_VGG_128_GN(in_nc=opt_net['in_nc'], nf=opt_net['nf'], input_img_factor=img_sz / 128)`
Wrap vgg disc 2020-08-26 00:14:45 +00:00			`if wrap:`
			`netD = GradDiscWrapper(netD)`
Discriminator part 1 New discriminator. Includes spectral norming. 2020-04-29 05:00:29 +00:00			`elif which_model == 'discriminator_resnet':`
Fixup upconv for the next attempt! 2020-05-02 01:56:14 +00:00			`netD = DiscriminatorResnet_arch.fixup_resnet34(num_filters=opt_net['nf'], num_classes=1, input_img_size=img_sz)`
Add support for passthrough disc/gen Add RRDBNetXL, which performs processing at multiple image sizes. Add DiscResnet_passthrough, which allows passthrough of image at different sizes for discrimination. Adjust the rest of the repo to allow generators that return more than just a single image. 2020-05-04 20:01:43 +00:00			`elif which_model == 'discriminator_resnet_passthrough':`
Fix skips & images samples - Makes skip connections between the generator and discriminator more extensible by adding additional configuration options for them and supporting 1 and 0 skips. - Places the temp/ directory with sample images from the training process appear in the training directory instead of the codes/ directory. 2020-05-15 19:50:49 +00:00			`netD = DiscriminatorResnet_arch_passthrough.fixup_resnet34(num_filters=opt_net['nf'], num_classes=1, input_img_size=img_sz,`
Allow passthrough discriminator to have passthrough disabled from config 2020-05-19 15:41:16 +00:00			`number_skips=opt_net['number_skips'], use_bn=True,`
			`disable_passthrough=opt_net['disable_passthrough'])`
Fix pixdisc bug 2020-07-06 03:49:09 +00:00			`elif which_model == 'discriminator_pix':`
			`netD = SRGAN_arch.Discriminator_VGG_PixLoss(in_nc=opt_net['in_nc'], nf=opt_net['nf'])`
Implement unet disc The latest discriminator architecture was already pretty much a unet. This one makes that official and uses shared layers. It also upsamples one additional time and throws out the lowest upsampling result. The intent is to delete the old vgg pixdisc, but I'll keep it around for a bit since I'm still trying out a few models with it. 2020-07-10 22:16:03 +00:00			`elif which_model == "discriminator_unet":`
			`netD = SRGAN_arch.Discriminator_UNet(in_nc=opt_net['in_nc'], nf=opt_net['nf'])`
Add u-net discriminator with feature output 2020-07-16 16:10:09 +00:00			`elif which_model == "discriminator_unet_fea":`
Allow feature discriminator unet to only output closest layer to feature output 2020-07-20 01:05:08 +00:00			`netD = SRGAN_arch.Discriminator_UNet_FeaOut(in_nc=opt_net['in_nc'], nf=opt_net['nf'], feature_mode=opt_net['feature_mode'])`
Add switched discriminator The logic is that the discriminator may be incapable of providing a truly targeted loss for all image regions since it has to be too generic (basically the same argument for the switched generator). So add some switches in! See how it works! 2020-07-23 02:52:59 +00:00			`elif which_model == "discriminator_switched":`
			`netD = SRGAN_arch.Discriminator_switched(in_nc=opt_net['in_nc'], nf=opt_net['nf'], initial_temp=opt_net['initial_temp'],`
			`final_temperature_step=opt_net['final_temperature_step'])`
Add cross-compare discriminator 2020-08-06 14:56:21 +00:00			`elif which_model == "cross_compare_vgg128":`
Enable testing in ExtensibleTrainer, fix it in SRGAN_model Also compute fea loss for this. 2020-08-31 15:41:48 +00:00			`netD = SRGAN_arch.CrossCompareDiscriminator(in_nc=opt_net['in_nc'], ref_channels=opt_net['ref_channels'] if 'ref_channels' in opt_net.keys() else 3, nf=opt_net['nf'], scale=opt_net['scale'])`
mmsr 2019-08-23 13:42:47 +00:00			`else:`
			`raise NotImplementedError('Discriminator model [{:s}] not recognized'.format(which_model))`
			`return netD`

Add capability to have old discriminators serve as feature networks 2020-07-31 20:59:54 +00:00			`# Discriminator`
wrap disc grad 2020-08-25 23:58:20 +00:00			`def define_D(opt, wrap=False):`
Add capability to have old discriminators serve as feature networks 2020-07-31 20:59:54 +00:00			`img_sz = opt['datasets']['train']['target_size']`
			`opt_net = opt['network_D']`
wrap disc grad 2020-08-25 23:58:20 +00:00			`return define_D_net(opt_net, img_sz, wrap=wrap)`
Add capability to have old discriminators serve as feature networks 2020-07-31 20:59:54 +00:00
			`def define_fixed_D(opt):`
			`# Note that this will not work with "old" VGG-style discriminators with dense blocks until the img_size parameter is added.`
			`net = define_D_net(opt)`

			`# Load the model parameters:`
			`load_net = torch.load(opt['pretrained_path'])`
			`load_net_clean = OrderedDict() # remove unnecessary 'module.'`
			`for k, v in load_net.items():`
			`if k.startswith('module.'):`
			`load_net_clean[k[7:]] = v`
			`else:`
			`load_net_clean[k] = v`
			`net.load_state_dict(load_net_clean)`

			`# Put into eval mode, freeze the parameters and set the 'weight' field.`
			`net.eval()`
			`for k, v in net.named_parameters():`
			`v.requires_grad = False`
			`net.fdisc_weight = opt['weight']`

Fix fixed_disc 2020-07-31 21:07:10 +00:00			`return net`

mmsr 2019-08-23 13:42:47 +00:00
			`# Define network used for perceptual loss`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`def define_F(which_model='vgg', use_bn=False, for_training=False, load_path=None):`
			`if which_model == 'vgg':`
Separate feature extractors out, add resnet feature extractor 2020-05-29 02:26:30 +00:00			`# PyTorch pretrained VGG19-54, before ReLU.`
			`if use_bn:`
			`feature_layer = 49`
			`else:`
			`feature_layer = 34`
Add feature_model for training custom feature nets 2020-07-31 17:20:39 +00:00			`if for_training:`
			`netF = feature_arch.TrainableVGGFeatureExtractor(feature_layer=feature_layer, use_bn=use_bn,`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`use_input_norm=True)`
Add feature_model for training custom feature nets 2020-07-31 17:20:39 +00:00			`else:`
			`netF = feature_arch.VGGFeatureExtractor(feature_layer=feature_layer, use_bn=use_bn,`
More ExtensibleTrainer work 2020-08-22 19:08:33 +00:00			`use_input_norm=True)`
			`elif which_model == 'wide_resnet':`
			`netF = feature_arch.WideResnetFeatureExtractor(use_input_norm=True)`
			`else:`
			`raise NotImplementedError`
Separate feature extractors out, add resnet feature extractor 2020-05-29 02:26:30 +00:00
Enable disjoint feature networks This is done by pre-training a feature net that predicts the features of HR images from LR images. Then use the original feature network and this new one in tandem to work only on LR/Gen images. 2020-07-31 22:29:47 +00:00			`if load_path:`
			`# Load the model parameters:`
			`load_net = torch.load(load_path)`
			`load_net_clean = OrderedDict() # remove unnecessary 'module.'`
			`for k, v in load_net.items():`
			`if k.startswith('module.'):`
			`load_net_clean[k[7:]] = v`
			`else:`
			`load_net_clean[k] = v`
			`netF.load_state_dict(load_net_clean)`

More ExtensibleTrainer work It runs now, just need to debug it to reach performance parity with SRGAN. Sweet. 2020-08-23 23:22:34 +00:00			`if not for_training:`
Enable disjoint feature networks This is done by pre-training a feature net that predicts the features of HR images from LR images. Then use the original feature network and this new one in tandem to work only on LR/Gen images. 2020-07-31 22:29:47 +00:00			`# Put into eval mode, freeze the parameters and set the 'weight' field.`
			`netF.eval()`
			`for k, v in netF.named_parameters():`
			`v.requires_grad = False`

mmsr 2019-08-23 13:42:47 +00:00			`return netF`