# DL-Art-School/codes/models/styled_sr/styled_sr.py

from math import log2
from random import random

import torch
import torch.nn as nn
import torch.nn.functional as F

from models.RRDBNet_arch import RRDB
from models.arch_util import ConvGnLelu, default_init_weights
from models.styled_sr.stylegan2_base import StyleVectorizer, GeneratorBlock, Conv2DMod, leaky_relu, Blur
from trainer.networks import register_model
from utils.util import checkpoint, opt_get


class EncoderRRDB(nn.Module):
    """Densely-connected stack of five 3x3 convolutions.

    Every convolution receives the block input concatenated (along the
    channel axis) with the outputs of all convolutions before it. The first
    four convolutions emit ``growth_channels`` channels and are followed by a
    LeakyReLU(0.2); the fifth emits ``output_channels`` channels and has no
    activation. Only the fifth convolution's output is returned - there is no
    residual connection back to the input inside this module.

    Args:
        mid_channels: channel count of the tensor fed to ``forward``.
        output_channels: channel count produced by the last convolution.
        growth_channels: channel count produced by each of the first four
            convolutions.
        init_weight: forwarded as the second argument of
            ``default_init_weights`` for every convolution (presumably a
            scale factor - confirm against ``models.arch_util``).
    """

    def __init__(self, mid_channels=64, output_channels=32, growth_channels=32, init_weight=.1):
        super().__init__()
        conv_count = 5
        # Register conv1..conv5 in order; each one's input widens by
        # growth_channels because of the dense concatenation in forward().
        for idx in range(1, conv_count + 1):
            in_width = mid_channels + (idx - 1) * growth_channels
            out_width = growth_channels if idx < conv_count else output_channels
            self.add_module(f'conv{idx}', nn.Conv2d(in_width, out_width, 3, 1, 1))
        self.lrelu = nn.LeakyReLU(negative_slope=0.2, inplace=True)
        # Re-initialise only after all five convolutions exist.
        for idx in range(1, conv_count + 1):
            default_init_weights(getattr(self, f'conv{idx}'), init_weight)

    def forward(self, x):
        """Run the dense block on ``x`` and return the last conv's output."""
        # `dense` always holds [x, x1, ..., xk] concatenated on dim 1, which
        # is exactly the input the next convolution expects.
        dense = x
        for conv in (self.conv1, self.conv2, self.conv3, self.conv4):
            dense = torch.cat((dense, self.lrelu(conv(dense))), 1)
        return self.conv5(dense)


class StyledSrEncoder(nn.Module):
    """Feature encoder: one 7x7 convolution followed by seven EncoderRRDB stages.

    The initial convolution maps 3 input channels to 32. Each stage then
    appends its own output (32 channels with EncoderRRDB's default
    ``output_channels``) to the running feature map, so the stages are built
    for 32, 64, ..., 224 input channels and the final feature map carries
    256 channels.

    Args:
        fea_out: accepted for interface compatibility but never read; the
            layer widths below are hard-coded for a 256-channel output.
        initial_stride: stride of the initial 7x7 convolution.
    """

    def __init__(self, fea_out=256, initial_stride=1):
        super().__init__()
        # Current assumes fea_out=256.
        self.initial_conv = ConvGnLelu(3, 32, kernel_size=7, stride=initial_stride,
                                       norm=False, activation=False, bias=True)
        # Stage k (1-based) consumes the 32*k channels accumulated so far.
        self.rrdbs = nn.ModuleList([EncoderRRDB(32 * stage) for stage in range(1, 8)])

    def forward(self, x):
        """Return the concatenation of the stem features and every stage output."""
        features = self.initial_conv(x)
        for stage in self.rrdbs:
            # Each stage runs through the project's `checkpoint` helper
            # (presumably gradient checkpointing - confirm in utils.util).
            grown = checkpoint(stage, features)
            features = torch.cat([features, grown], dim=1)
        return features


class Generator(nn.Module):
    """Style-modulated super-resolution generator.

    A StyledSrEncoder turns the low-resolution image into a feature map, which
    is then passed through ``upsample_levels + 1`` GeneratorBlocks. The first
    block is built with ``upsample=False`` and the last with
    ``upsample_rgb=False``; every other flag is True.

    Args:
        image_size: stored on the instance; not otherwise used in this class.
        latent_dim: style vector width handed to every GeneratorBlock.
        initial_stride: stride forwarded to the encoder's first convolution.
        start_level: index into the channel table at which the first block
            starts.
        upsample_levels: number of blocks that upsample; ``self.scale`` is
            ``2 ** upsample_levels``.
    """

    def __init__(self, image_size, latent_dim, initial_stride=1, start_level=3, upsample_levels=2):
        super().__init__()
        # The first level handles the raw encoder output and doesn't upsample.
        total_levels = upsample_levels + 1
        self.image_size = image_size
        self.scale = 2 ** upsample_levels
        self.latent_dim = latent_dim
        self.num_layers = total_levels

        # Channel width per level; the trailing comment is the resolution
        # label each entry carried in the original table.
        filters = [
            512,  # 4x4
            512,  # 8x8
            512,  # 16x16
            256,  # 32x32
            128,  # 64x64
            64,   # 128x128
            32,   # 256x256
            16,   # 512x512
            8,    # 1024x1024
        ]

        self.encoder = StyledSrEncoder(filters[start_level], initial_stride)

        # (in, out) channel pair for each level: neighbouring table entries.
        channel_pairs = list(zip(filters, filters[1:]))
        final_level = start_level + total_levels - 1
        self.blocks = nn.ModuleList([])
        for level in range(start_level, final_level + 1):
            in_chan, out_chan = channel_pairs[level]
            self.blocks.append(GeneratorBlock(
                latent_dim,
                in_chan,
                out_chan,
                upsample=(level != start_level),
                upsample_rgb=(level != final_level),
            ))

    def forward(self, lr, styles):
        """Generate an image from ``lr`` using one style vector per block.

        Args:
            lr: 4-D low-resolution image batch.
            styles: tensor whose dims 0 and 1 are swapped before use so that
                iterating it yields one entry per block (assumes a
                (batch, num_layers, latent_dim) layout - confirm with caller).

        Returns:
            The ``rgb`` tensor produced by the last block.
        """
        batch, _, height, width = lr.shape
        feats = self.encoder(lr)

        per_layer_styles = styles.transpose(0, 1)
        # Uniform [0, 1) noise drawn at the input size times self.scale.
        input_noise = torch.rand(batch, height * self.scale, width * self.scale, 1).to(lr.device)
        # If the encoder changed the spatial size (e.g. initial_stride > 1),
        # shrink the starting RGB image to match the feature map.
        if height == feats.shape[-2]:
            rgb = lr
        else:
            rgb = F.interpolate(lr, size=feats.shape[2:], mode="area")
        for layer_style, layer in zip(per_layer_styles, self.blocks):
            feats, rgb = checkpoint(layer, feats, rgb, layer_style, input_noise)

        return rgb


class StyledSrGenerator(nn.Module):
    """Top-level styled SR model: a style vectorizer feeding a Generator.

    Style latents are sampled internally on every forward pass; the caller
    supplies only the low-resolution image.

    Args:
        image_size: forwarded to Generator.
        initial_stride: forwarded to Generator.
        latent_dim: width of the sampled noise and of the Generator's styles.
        style_depth: second positional argument of StyleVectorizer
            (presumably its layer count - confirm in stylegan2_base).
        lr_mlp: passed to StyleVectorizer as ``lr_mul``.
    """

    def __init__(self, image_size, initial_stride=1, latent_dim=512, style_depth=8, lr_mlp=.1):
        super().__init__()
        self.vectorizer = StyleVectorizer(latent_dim, style_depth, lr_mul=lr_mlp)
        self.gen = Generator(image_size=image_size, latent_dim=latent_dim, initial_stride=initial_stride)
        # Threshold for the style-mixing draw in forward(): mixing happens
        # unless random() exceeds this value.
        self.mixed_prob = .9
        self._init_weights()

    def _init_weights(self):
        """Kaiming-initialise plain conv/linear layers, then zero the noise projections."""
        for module in self.modules():
            # Exact type match on purpose: subclasses of Conv2d/Linear are skipped.
            exact_type = type(module)
            if exact_type is not nn.Conv2d and exact_type is not nn.Linear:
                continue
            if not hasattr(module, 'weight'):
                continue
            nn.init.kaiming_normal_(module.weight, a=0, mode='fan_in', nonlinearity='leaky_relu')

        # Zero weight and bias of both noise projections in every block.
        for block in self.gen.blocks:
            for noise_proj in (block.to_noise1, block.to_noise2):
                nn.init.zeros_(noise_proj.weight)
                nn.init.zeros_(noise_proj.bias)

    def forward(self, x):
        """Super-resolve ``x`` with freshly sampled, randomly mixed styles.

        Args:
            x: 4-D low-resolution image batch.

        Returns:
            Tuple ``(out, diff, w_styles)``: the generator output; the
            per-sample sum of absolute differences between ``x`` and the
            output area-downsampled back to ``x``'s spatial size; and the
            per-layer styles that were fed to the generator.
        """
        batch, _, _, _ = x.shape
        layer_count = self.gen.num_layers

        # Synthesize style latents from noise: two candidates per sample.
        noise = torch.randn(batch * 2, self.gen.latent_dim).to(x.device)
        latents = self.vectorizer(noise)

        # Randomly distribute styles across layers. Row j of the result is
        # built in place from candidate rows 2j and 2j+1.
        w_styles = latents[:, None, :].expand(-1, layer_count, -1).clone()
        for j in range(batch):
            first, second = j * 2, j * 2 + 1
            cutoff = int(torch.rand(()).numpy() * layer_count)
            if cutoff == layer_count or random() > self.mixed_prob:
                # No mixing: every layer uses the first candidate.
                w_styles[j] = w_styles[first]
                continue
            # Mixing: layers before the cutoff use the first candidate,
            # the remaining layers use the second.
            w_styles[j, :cutoff] = w_styles[first, :cutoff]
            w_styles[j, cutoff:] = w_styles[second, cutoff:]
        w_styles = w_styles[:batch]

        out = self.gen(x, w_styles)

        # Compute the net, areal, pixel-wise additions made on top of the LR image.
        lr_size = (x.shape[-2], x.shape[-1])
        out_down = F.interpolate(out, size=lr_size, mode="area")
        diff = (out_down - x).abs().sum(dim=[1, 2, 3])

        return out, diff, w_styles


if __name__ == '__main__':
    # Smoke test: build the model with initial_stride=2, push one random
    # 64x64 RGB image through it and print the shape of each returned tensor.
    model = StyledSrGenerator(image_size=128, initial_stride=2)
    results = model(torch.rand(1, 3, 64, 64))
    print([tensor.shape for tensor in results])


@register_model
def register_styled_sr(opt_net, opt):
    """Build a StyledSrGenerator from the network options.

    Args:
        opt_net: network options; only the ``initial_stride`` entry is read
            (via ``opt_get``, with 1 as the fallback value).
        opt: not used by this function.

    Returns:
        A StyledSrGenerator constructed with ``image_size`` fixed at 128.
    """
    stride = opt_get(opt_net, ['initial_stride'], 1)
    return StyledSrGenerator(128, initial_stride=stride)
Styled SR model 2021-01-01 03:54:18 +00:00			`from math import log2`
			`from random import random`

			`import torch`
			`import torch.nn as nn`
			`import torch.nn.functional as F`

			`from models.RRDBNet_arch import RRDB`
			`from models.arch_util import ConvGnLelu, default_init_weights`
More mods to support styledsr 2021-01-04 18:32:28 +00:00			`from models.styled_sr.stylegan2_base import StyleVectorizer, GeneratorBlock, Conv2DMod, leaky_relu, Blur`
Styled SR model 2021-01-01 03:54:18 +00:00			`from trainer.networks import register_model`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`from utils.util import checkpoint, opt_get`
Styled SR model 2021-01-01 03:54:18 +00:00

			`class EncoderRRDB(nn.Module):`
			`def __init__(self, mid_channels=64, output_channels=32, growth_channels=32, init_weight=.1):`
			`super(EncoderRRDB, self).__init__()`
			`for i in range(5):`
			`out_channels = output_channels if i == 4 else growth_channels`
			`self.add_module(`
			`f'conv{i+1}',`
			`nn.Conv2d(mid_channels + i * growth_channels, out_channels, 3,`
			`1, 1))`
			`self.lrelu = nn.LeakyReLU(negative_slope=0.2, inplace=True)`
			`for i in range(5):`
			`default_init_weights(getattr(self, f'conv{i+1}'), init_weight)`

			`def forward(self, x):`
			`x1 = self.lrelu(self.conv1(x))`
			`x2 = self.lrelu(self.conv2(torch.cat((x, x1), 1)))`
			`x3 = self.lrelu(self.conv3(torch.cat((x, x1, x2), 1)))`
			`x4 = self.lrelu(self.conv4(torch.cat((x, x1, x2, x3), 1)))`
			`x5 = self.conv5(torch.cat((x, x1, x2, x3, x4), 1))`
			`return x5`


			`class StyledSrEncoder(nn.Module):`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`def __init__(self, fea_out=256, initial_stride=1):`
Styled SR model 2021-01-01 03:54:18 +00:00			`super().__init__()`
			`# Current assumes fea_out=256.`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`self.initial_conv = ConvGnLelu(3, 32, kernel_size=7, stride=initial_stride, norm=False, activation=False, bias=True)`
Styled SR model 2021-01-01 03:54:18 +00:00			`self.rrdbs = nn.ModuleList([`
			`EncoderRRDB(32),`
			`EncoderRRDB(64),`
			`EncoderRRDB(96),`
			`EncoderRRDB(128),`
			`EncoderRRDB(160),`
			`EncoderRRDB(192),`
			`EncoderRRDB(224)])`

			`def forward(self, x):`
			`fea = self.initial_conv(x)`
			`for rrdb in self.rrdbs:`
			`fea = torch.cat([fea, checkpoint(rrdb, fea)], dim=1)`
			`return fea`


			`class Generator(nn.Module):`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`def __init__(self, image_size, latent_dim, initial_stride=1, start_level=3, upsample_levels=2):`
Styled SR model 2021-01-01 03:54:18 +00:00			`super().__init__()`
			`total_levels = upsample_levels + 1 # The first level handles the raw encoder output and doesn't upsample.`
			`self.image_size = image_size`
			`self.scale = 2 ** upsample_levels`
			`self.latent_dim = latent_dim`
			`self.num_layers = total_levels`
			`filters = [`
			`512, # 4x4`
			`512, # 8x8`
			`512, # 16x16`
			`256, # 32x32`
			`128, # 64x64`
			`64, # 128x128`
			`32, # 256x256`
			`16, # 512x512`
			`8, # 1024x1024`
			`]`

Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`self.encoder = StyledSrEncoder(filters[start_level], initial_stride)`
Styled SR model 2021-01-01 03:54:18 +00:00
			`in_out_pairs = list(zip(filters[:-1], filters[1:]))`
			`self.blocks = nn.ModuleList([])`
			`for ind in range(start_level, start_level+total_levels):`
			`in_chan, out_chan = in_out_pairs[ind]`
			`not_first = ind != start_level`
			`not_last = ind != (start_level+total_levels-1)`
			`block = GeneratorBlock(`
			`latent_dim,`
			`in_chan,`
			`out_chan,`
			`upsample=not_first,`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`upsample_rgb=not_last`
Styled SR model 2021-01-01 03:54:18 +00:00			`)`
			`self.blocks.append(block)`

			`def forward(self, lr, styles):`
			`b, c, h, w = lr.shape`
styled_sr: fix bug when using initial_stride 2021-01-01 19:13:21 +00:00			`x = self.encoder(lr)`
Styled SR model 2021-01-01 03:54:18 +00:00
			`styles = styles.transpose(0, 1)`
styled_sr: fix bug when using initial_stride 2021-01-01 19:13:21 +00:00			`input_noise = torch.rand(b, h * self.scale, w * self.scale, 1).to(lr.device)`
			`if h != x.shape[-2]:`
			`rgb = F.interpolate(lr, size=x.shape[2:], mode="area")`
			`else:`
			`rgb = lr`
Styled SR model 2021-01-01 03:54:18 +00:00			`for style, block in zip(styles, self.blocks):`
			`x, rgb = checkpoint(block, x, rgb, style, input_noise)`

			`return rgb`


			`class StyledSrGenerator(nn.Module):`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`def __init__(self, image_size, initial_stride=1, latent_dim=512, style_depth=8, lr_mlp=.1):`
Styled SR model 2021-01-01 03:54:18 +00:00			`super().__init__()`
			`self.vectorizer = StyleVectorizer(latent_dim, style_depth, lr_mul=lr_mlp)`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`self.gen = Generator(image_size=image_size, latent_dim=latent_dim, initial_stride=initial_stride)`
Styled SR model 2021-01-01 03:54:18 +00:00			`self.mixed_prob = .9`
			`self._init_weights()`

			`def _init_weights(self):`
			`for m in self.modules():`
			`if type(m) in {nn.Conv2d, nn.Linear} and hasattr(m, 'weight'):`
			`nn.init.kaiming_normal_(m.weight, a=0, mode='fan_in', nonlinearity='leaky_relu')`

			`for block in self.gen.blocks:`
			`nn.init.zeros_(block.to_noise1.weight)`
			`nn.init.zeros_(block.to_noise2.weight)`
			`nn.init.zeros_(block.to_noise1.bias)`
			`nn.init.zeros_(block.to_noise2.bias)`

			`def forward(self, x):`
			`b, f, h, w = x.shape`

			`# Synthesize style latents from noise.`
			`style = torch.randn(b*2, self.gen.latent_dim).to(x.device)`
			`w = self.vectorizer(style)`

			`# Randomly distribute styles across layers`
			`w_styles = w[:,None,:].expand(-1, self.gen.num_layers, -1).clone()`
			`for j in range(b):`
			`cutoff = int(torch.rand(()).numpy() * self.gen.num_layers)`
			`if cutoff == self.gen.num_layers or random() > self.mixed_prob:`
			`w_styles[j] = w_styles[j*2]`
			`else:`
			`w_styles[j, :cutoff] = w_styles[j*2, :cutoff]`
			`w_styles[j, cutoff:] = w_styles[j*2+1, cutoff:]`
			`w_styles = w_styles[:b]`

			`out = self.gen(x, w_styles)`

			`# Compute the net, areal, pixel-wise additions made on top of the LR image.`
			`out_down = F.interpolate(out, size=(x.shape[-2], x.shape[-1]), mode="area")`
			`diff = torch.sum(torch.abs(out_down - x), dim=[1,2,3])`

			`return out, diff, w_styles`


			`if __name__ == '__main__':`
styled_sr: fix bug when using initial_stride 2021-01-01 19:13:21 +00:00			`gen = StyledSrGenerator(128, 2)`
			`out = gen(torch.rand(1,3,64,64))`
Styled SR model 2021-01-01 03:54:18 +00:00			`print([o.shape for o in out])`


			`@register_model`
Add initial_stride term to style_sr Also fix fid and a networks.py issue. 2021-01-01 18:59:36 +00:00			`def register_styled_sr(opt_net, opt):`
			`return StyledSrGenerator(128, initial_stride=opt_get(opt_net, ['initial_stride'], 1))`