Rework stylegan2 divergence losses

Notably: include unet loss
This commit is contained in:
James Betker 2020-11-15 11:26:44 -07:00
parent ea94b93a37
commit 99f0cfaab5
4 changed files with 193 additions and 71 deletions

View File

@ -0,0 +1,14 @@
from models.archs.stylegan.stylegan2 import StyleGan2DivergenceLoss, StyleGan2PathLengthLoss
from models.archs.stylegan.stylegan2_unet_disc import StyleGan2UnetDivergenceLoss
def create_stylegan2_loss(opt_loss, env):
    """Factory for StyleGAN2 losses, keyed on opt_loss['type'].

    Args:
        opt_loss: loss options dict; must contain a 'type' key.
        env: shared training environment, passed through to the loss.

    Returns:
        The constructed ConfigurableLoss subclass instance.

    Raises:
        NotImplementedError: for an unrecognized loss type.
    """
    # Renamed from `type` to avoid shadowing the builtin.
    loss_type = opt_loss['type']
    if loss_type == 'stylegan2_divergence':
        return StyleGan2DivergenceLoss(opt_loss, env)
    elif loss_type == 'stylegan2_pathlen':
        return StyleGan2PathLengthLoss(opt_loss, env)
    elif loss_type == 'stylegan2_unet_divergence':
        return StyleGan2UnetDivergenceLoss(opt_loss, env)
    else:
        raise NotImplementedError(f"Unknown stylegan2 loss type: {loss_type}")

View File

@ -13,6 +13,7 @@ from torch import nn
from torch.autograd import grad as torch_grad
from vector_quantize_pytorch import VectorQuantize
from models.steps.losses import ConfigurableLoss
from utils.util import checkpoint
try:
@ -304,6 +305,9 @@ class StyleGan2Augmentor(nn.Module):
if detach:
images = images.detach()
# Save away for use elsewhere (e.g. unet loss)
self.aug_images = images
return self.D(images)
@ -694,3 +698,68 @@ class StyleGan2Discriminator(nn.Module):
for m in self.modules():
if type(m) in {nn.Conv2d, nn.Linear}:
nn.init.kaiming_normal_(m.weight, a=0, mode='fan_in', nonlinearity='leaky_relu')
class StyleGan2DivergenceLoss(ConfigurableLoss):
    """Hinge divergence loss for a StyleGAN2 discriminator.

    When opt['gen_loss'] is True, forward() returns the generator-side loss
    (mean discriminator score on fakes). Otherwise it returns the
    discriminator hinge loss, augmented with a gradient penalty every
    opt['gradient_penalty_frequency'] steps.
    """
    def __init__(self, opt, env):
        super().__init__(opt, env)
        # State keys for the real and generated image batches.
        self.real = opt['real']
        self.fake = opt['fake']
        # Name of the discriminator in env['discriminators'].
        self.discriminator = opt['discriminator']
        self.for_gen = opt['gen_loss']
        self.gp_frequency = opt['gradient_penalty_frequency']
        # Optional instance-noise magnitude; dict.get replaces the manual
        # `'noise' in opt.keys()` check.
        self.noise = opt.get('noise', 0)

    def forward(self, net, state):
        real_input = state[self.real]
        fake_input = state[self.fake]
        if self.noise != 0:
            # torch.rand_like draws from [0, 1), so this is one-sided noise.
            fake_input = fake_input + torch.rand_like(fake_input) * self.noise
            real_input = real_input + torch.rand_like(real_input) * self.noise

        D = self.env['discriminators'][self.discriminator]
        fake = D(fake_input)
        if self.for_gen:
            return fake.mean()
        else:
            real_input.requires_grad_()  # <-- Needed to compute gradients on the input.
            real = D(real_input)
            # Hinge: real scores pushed below -1, fake scores above +1
            # (lower = more real under this sign convention).
            divergence_loss = (F.relu(1 + real) + F.relu(1 - fake)).mean()

            # Apply gradient penalty. TODO: migrate this elsewhere.
            if self.env['step'] % self.gp_frequency == 0:
                # Deferred import — presumably avoids a circular import with
                # stylegan2.py; confirm before hoisting to module level.
                from models.archs.stylegan.stylegan2 import gradient_penalty
                gp = gradient_penalty(real_input, real)
                self.metrics.append(("gradient_penalty", gp.clone().detach()))
                divergence_loss = divergence_loss + gp
            real_input.requires_grad_(requires_grad=False)
            return divergence_loss
class StyleGan2PathLengthLoss(ConfigurableLoss):
    """StyleGAN2 path-length regularization.

    Penalizes the squared deviation of the current batch's perceptual path
    lengths from an exponential moving average of past path lengths.
    """
    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.w_styles = opt['w_styles']  # state key for the w-space styles
        self.gen = opt['gen']            # state key for the generated images
        self.pl_mean = None              # EMA of path lengths; empty until first update
        from models.archs.stylegan.stylegan2 import EMA
        self.pl_length_ma = EMA(.99)

    def forward(self, net, state):
        w_styles = state[self.w_styles]
        gen = state[self.gen]
        from models.archs.stylegan.stylegan2 import calc_pl_lengths, is_empty
        pl_lengths = calc_pl_lengths(w_styles, gen)
        avg_pl_length = np.mean(pl_lengths.detach().cpu().numpy())

        pl_loss = None
        if not is_empty(self.pl_mean):
            pl_loss = ((pl_lengths - self.pl_mean) ** 2).mean()
            if torch.isnan(pl_loss):
                print("Path length loss returned NaN!")
                pl_loss = None

        # Bug fix: advance the moving average on every call. The previous
        # version returned before this update whenever a valid loss was
        # produced, which froze pl_mean at its first recorded value.
        self.pl_mean = self.pl_length_ma.update_average(self.pl_mean, avg_pl_length)
        return pl_loss if pl_loss is not None else 0

View File

@ -1,10 +1,14 @@
from functools import partial
from math import log2
from random import random
import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from models.archs.stylegan.stylegan2 import attn_and_ff
from models.steps.losses import ConfigurableLoss
def leaky_relu(p=0.2):
@ -132,4 +136,105 @@ class StyleGan2UnetDiscriminator(nn.Module):
x = up_block(x, res)
dec_out = self.conv_out(x)
return dec_out
return dec_out, enc_out
def warmup(start, end, max_steps, current_step):
    """Linearly ramp a scalar from `start` to `end` over `max_steps` steps.

    Returns `start` at step 0, the linear interpolant while ramping, and
    exactly `end` once `current_step` reaches `max_steps`. Using `>=`
    (rather than `>`) also guards against a ZeroDivisionError when
    max_steps == 0 and avoids float round-off at the boundary.
    """
    if current_step >= max_steps:
        return end
    return (end - start) * (current_step / max_steps) + start
def mask_src_tgt(source, target, mask):
    """Blend two tensors: take `source` where mask is 1, `target` where mask is 0."""
    return mask * source + target * (1 - mask)
def cutmix(source, target, coors, alpha = 1.):
    """Return a copy of `source` whose rectangle described by `coors` is
    replaced with the corresponding region of `target`.

    coors: (((y0, y1), (x0, x1)), lam), as produced by cutmix_coordinates;
    lam is unused here. `alpha` is likewise unused (kept for interface
    compatibility). Inputs are left unmodified.
    """
    (ys, xs), _ = coors
    y0, y1 = ys
    x0, x1 = xs
    patched = source.clone()
    patched[:, :, y0:y1, x0:x1] = target.clone()[:, :, y0:y1, x0:x1]
    return patched
def cutmix_coordinates(height, width, alpha = 1.):
lam = np.random.beta(alpha, alpha)
cx = np.random.uniform(0, width)
cy = np.random.uniform(0, height)
w = width * np.sqrt(1 - lam)
h = height * np.sqrt(1 - lam)
x0 = int(np.round(max(cx - w / 2, 0)))
x1 = int(np.round(min(cx + w / 2, width)))
y0 = int(np.round(max(cy - h / 2, 0)))
y1 = int(np.round(min(cy + h / 2, height)))
return ((y0, y1), (x0, x1)), lam
class StyleGan2UnetDivergenceLoss(ConfigurableLoss):
    """Divergence loss for the U-net StyleGAN2 discriminator.

    The discriminator returns (decoder_output, encoder_output). The generator
    loss combines both heads; the discriminator loss sums per-head hinge
    divergences, a CutMix consistency-regularization term (per "A U-Net Based
    Discriminator for Generative Adversarial Networks"), and a periodic
    gradient penalty.
    """
    def __init__(self, opt, env):
        super().__init__(opt, env)
        # State keys for the real and generated image batches.
        self.real = opt['real']
        self.fake = opt['fake']
        # Name of the discriminator in env['discriminators'].
        self.discriminator = opt['discriminator']
        self.for_gen = opt['gen_loss']
        self.gp_frequency = opt['gradient_penalty_frequency']
        self.noise = opt.get('noise', 0)  # instance-noise magnitude
        self.image_size = opt['image_size']
        # Bug fix: cr_weight was referenced in forward() but never defined.
        # 0.2 is the default used by the reference U-net GAN implementation.
        self.cr_weight = opt.get('cr_weight', .2)
        # Defined up-front so the attribute exists before the first CutMix step.
        self.last_cr_loss = 0

    def forward(self, net, state):
        real_input = state[self.real]
        fake_input = state[self.fake]
        if self.noise != 0:
            fake_input = fake_input + torch.rand_like(fake_input) * self.noise
            real_input = real_input + torch.rand_like(real_input) * self.noise

        D = self.env['discriminators'][self.discriminator]
        fake_dec, fake_enc = D(fake_input)
        fake_aug_images = D.aug_images
        if self.for_gen:
            return fake_enc.mean() + F.relu(1 + fake_dec).mean()
        else:
            # Ramp the decoder term and the CutMix probability in over the
            # first 30k steps.
            dec_loss_coef = warmup(0, 1., 30000, self.env['step'])
            cutmix_prob = warmup(0, 0.25, 30000, self.env['step'])
            apply_cutmix = random() < cutmix_prob

            real_input.requires_grad_()  # <-- Needed to compute gradients on the input.
            real_dec, real_enc = D(real_input)
            real_aug_images = D.aug_images
            enc_divergence = (F.relu(1 + real_enc) + F.relu(1 - fake_enc)).mean()
            dec_divergence = (F.relu(1 + real_dec) + F.relu(1 - fake_dec)).mean()
            # Bug fix: assign disc_loss unconditionally; previously it was only
            # bound inside the CutMix branch, so the no-CutMix path raised
            # NameError at return.
            disc_loss = enc_divergence + dec_divergence * dec_loss_coef

            if apply_cutmix:
                # Binary mask with 1s in the cut rectangle's complement.
                mask = cutmix(
                    torch.ones_like(real_dec),
                    torch.zeros_like(real_dec),
                    cutmix_coordinates(self.image_size, self.image_size)
                )
                if random() > 0.5:
                    mask = 1 - mask
                cutmix_images = mask_src_tgt(real_aug_images, fake_aug_images, mask)
                # Bug fix: this loss has no self.GAN attribute — use the
                # configured discriminator. D returns (decoder, encoder), so
                # the unpack order now matches the calls above (it was swapped).
                cutmix_dec_out, cutmix_enc_out = D(cutmix_images)
                cutmix_enc_divergence = F.relu(1 - cutmix_enc_out).mean()
                cutmix_dec_divergence = F.relu(1 + (mask * 2 - 1) * cutmix_dec_out).mean()
                disc_loss = disc_loss + cutmix_enc_divergence + cutmix_dec_divergence

                # Consistency regularization: the decoder output on the mixed
                # image should match the mix of the per-image decoder outputs.
                cr_cutmix_dec_out = mask_src_tgt(real_dec, fake_dec, mask)
                cr_loss = F.mse_loss(cutmix_dec_out, cr_cutmix_dec_out) * self.cr_weight
                self.last_cr_loss = cr_loss.clone().detach().item()
                disc_loss = disc_loss + cr_loss * dec_loss_coef

            # Apply gradient penalty. TODO: migrate this elsewhere.
            if self.env['step'] % self.gp_frequency == 0:
                from models.archs.stylegan.stylegan2 import gradient_penalty
                # Bug fix: `real` was undefined here. Penalize gradients of the
                # decoder output w.r.t. the real input. TODO(review): confirm
                # whether the encoder head should also be penalized.
                gp = gradient_penalty(real_input, real_dec)
                self.metrics.append(("gradient_penalty", gp.clone().detach()))
                disc_loss = disc_loss + gp
            real_input.requires_grad_(requires_grad=False)
            return disc_loss

View File

@ -15,6 +15,9 @@ def create_loss(opt_loss, env):
if 'teco_' in type:
from models.steps.tecogan_losses import create_teco_loss
return create_teco_loss(opt_loss, env)
elif 'stylegan2_' in type:
from models.archs.stylegan import create_stylegan2_loss
return create_stylegan2_loss(opt_loss, env)
elif type == 'pix':
return PixLoss(opt_loss, env)
elif type == 'direct':
@ -37,10 +40,6 @@ def create_loss(opt_loss, env):
return RecurrentLoss(opt_loss, env)
elif type == 'for_element':
return ForElementLoss(opt_loss, env)
elif type == 'stylegan2_divergence':
return StyleGan2DivergenceLoss(opt_loss, env)
elif type == 'stylegan2_pathlen':
return StyleGan2PathLengthLoss(opt_loss, env)
else:
raise NotImplementedError
@ -487,68 +486,3 @@ class ForElementLoss(ConfigurableLoss):
def clear_metrics(self):
self.loss.clear_metrics()
class StyleGan2DivergenceLoss(ConfigurableLoss):
    """Hinge divergence loss for a StyleGAN2 discriminator.

    When opt['gen_loss'] is True, forward() returns the generator-side loss
    (mean discriminator score on fakes); otherwise it returns the
    discriminator hinge loss plus a gradient penalty every
    opt['gradient_penalty_frequency'] steps.
    """
    def __init__(self, opt, env):
        super().__init__(opt, env)
        # State keys for the real and generated image batches.
        self.real = opt['real']
        self.fake = opt['fake']
        # Name of the discriminator in env['discriminators'].
        self.discriminator = opt['discriminator']
        self.for_gen = opt['gen_loss']
        self.gp_frequency = opt['gradient_penalty_frequency']
        # Optional instance-noise magnitude; defaults to no noise.
        self.noise = opt['noise'] if 'noise' in opt.keys() else 0

    def forward(self, net, state):
        real_input = state[self.real]
        fake_input = state[self.fake]
        if self.noise != 0:
            # torch.rand_like draws from [0, 1), so this is one-sided noise.
            fake_input = fake_input + torch.rand_like(fake_input) * self.noise
            real_input = real_input + torch.rand_like(real_input) * self.noise

        D = self.env['discriminators'][self.discriminator]
        fake = D(fake_input)
        if self.for_gen:
            return fake.mean()
        else:
            real_input.requires_grad_()  # <-- Needed to compute gradients on the input.
            real = D(real_input)
            # Hinge: real scores pushed below -1, fake scores above +1
            # (lower = more real under this sign convention).
            divergence_loss = (F.relu(1 + real) + F.relu(1 - fake)).mean()

            # Apply gradient penalty. TODO: migrate this elsewhere.
            if self.env['step'] % self.gp_frequency == 0:
                # Deferred import — presumably avoids a circular import with
                # stylegan2.py. TODO(review): confirm before hoisting.
                from models.archs.stylegan.stylegan2 import gradient_penalty
                gp = gradient_penalty(real_input, real)
                self.metrics.append(("gradient_penalty", gp.clone().detach()))
                divergence_loss = divergence_loss + gp
            real_input.requires_grad_(requires_grad=False)
            return divergence_loss
class StyleGan2PathLengthLoss(ConfigurableLoss):
    """StyleGAN2 path-length regularization.

    Penalizes deviation of the current batch's perceptual path lengths from
    an exponential moving average of past path lengths.
    """
    def __init__(self, opt, env):
        super().__init__(opt, env)
        self.w_styles = opt['w_styles']  # state key for the w-space styles
        self.gen = opt['gen']            # state key for the generated images
        self.pl_mean = None              # EMA of path lengths; None until first update
        from models.archs.stylegan.stylegan2 import EMA
        self.pl_length_ma = EMA(.99)

    def forward(self, net, state):
        w_styles = state[self.w_styles]
        gen = state[self.gen]
        from models.archs.stylegan.stylegan2 import calc_pl_lengths
        pl_lengths = calc_pl_lengths(w_styles, gen)
        avg_pl_length = np.mean(pl_lengths.detach().cpu().numpy())
        from models.archs.stylegan.stylegan2 import is_empty
        if not is_empty(self.pl_mean):
            pl_loss = ((pl_lengths - self.pl_mean) ** 2).mean()
            if not torch.isnan(pl_loss):
                # NOTE(review): returning here skips the EMA update below, so
                # pl_mean stops tracking once it is first populated — confirm
                # whether the update should happen before this return.
                return pl_loss
            else:
                print("Path length loss returned NaN!")
        self.pl_mean = self.pl_length_ma.update_average(self.pl_mean, avg_pl_length)
        return 0