# DL-Art-School/codes/scripts/byol/byol_uresnet_playground.py

import os
import shutil
from random import shuffle

import matplotlib.cm as cm
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision
from PIL import Image
from torch.utils.data import DataLoader
from torchvision.models.resnet import Bottleneck
from torchvision.transforms import ToTensor, Resize
from tqdm import tqdm
import numpy as np

import utils
from data.image_folder_dataset import ImageFolderDataset
from models.pixel_level_contrastive_learning.resnet_unet import UResNet50
from models.pixel_level_contrastive_learning.resnet_unet_2 import UResNet50_2
from models.pixel_level_contrastive_learning.resnet_unet_3 import UResNet50_3
from models.resnet_with_checkpointing import resnet50
from models.spinenet_arch import SpineNet


# Computes the structural euclidean distance between [x,y]. "Structural" here means the [h,w] dimensions are preserved
# and the distance is computed across the channel dimension.
from scripts.byol.byol_spinenet_playground import find_similar_latents, create_latent_database
from utils import util
from utils.kmeans import kmeans, kmeans_predict
from utils.options import dict_to_nonedict


def structural_euc_dist(x, y):
    """Euclidean distance between `x` and `y`, reduced over the last dimension.

    The element-wise difference is squared, summed along ``dim=-1`` and the
    square root of that sum is returned, so all leading dimensions of the
    (broadcast) inputs are preserved in the result.
    """
    squared_delta = (x - y).pow(2)
    return squared_delta.sum(dim=-1).sqrt()


def cosine_similarity(x, y):
    """Negated cosine similarity of `x` and `y` along the last dimension.

    Both inputs are first standardised with `norm` (mean subtracted and divided
    by the standard deviation over the last dimension). The similarity is
    negated so that, like the distance functions in this file, a smaller
    return value means the inputs are more alike.
    """
    x = norm(x)
    y = norm(y)
    # nn.CosineSimilarity defaults to dim=1, which only coincides with the last
    # dimension for 2-D inputs. Reduce over dim=-1 explicitly so the similarity
    # is taken along the same axis that `norm` standardised.
    return -nn.CosineSimilarity(dim=-1)(x, y)


def key_value_difference(x, y):
    """Return ``2 - 2 * dot(x_unit, y_unit)`` taken over the last dimension.

    `x_unit` and `y_unit` are the inputs L2-normalised along ``dim=-1``, so the
    value is 0 when the two vectors point the same way and 4 when they point
    in opposite directions.
    """
    unit_x, unit_y = (F.normalize(t, p=2, dim=-1) for t in (x, y))
    dot = torch.sum(unit_x * unit_y, dim=-1)
    return 2 - 2 * dot


def norm(x):
    """Standardise `x` along its last dimension.

    The mean over ``dim=-1`` is subtracted and the result is divided by
    ``torch.std`` over the same dimension. There is no epsilon guard, so a
    slice with zero standard deviation produces non-finite values.
    """
    centre = x.mean(dim=-1, keepdim=True)
    spread = x.std(dim=-1, keepdim=True)
    return (x - centre) / spread


def im_norm(x):
    """Standardise every channel plane of a 4-D batch and recentre it on 0.5.

    For each (dim 0, dim 1) plane the mean over dims 2 and 3 is subtracted and
    the result is divided by the standard deviation over the same dims; the
    outcome is then scaled by 0.5 and offset by 0.5. The input is presumably
    laid out as (N, C, H, W) -- confirm against callers.

    Returns a tensor with the same shape as `x`.
    """
    # keepdim=True keeps the statistics shaped (N, C, 1, 1) so they broadcast
    # plane-by-plane. Flattening them to (N*C, 1, 1, 1) only lines up with `x`
    # when C == 1; otherwise it either fails to broadcast or silently yields a
    # (C, C, H, W) result for a single-image batch.
    mean = torch.mean(x, dim=(2, 3), keepdim=True)
    std = torch.std(x, dim=(2, 3), keepdim=True)
    return ((x - mean) / std) * .5 + .5


def get_image_folder_dataloader(batch_size, num_workers, target_size=256):
    """Build a shuffling DataLoader over the hard-coded image folder.

    Args:
        batch_size: Forwarded to ``DataLoader``.
        num_workers: Forwarded to ``DataLoader``.
        target_size: Stored under the ``'target_size'`` dataset option.

    Returns:
        A ``DataLoader`` wrapping an ``ImageFolderDataset`` with ``shuffle=True``.
    """
    # Alternative dataset roots that have been swapped in for other runs:
    #   'F:\\4k6k\\datasets\\images\\imagenet_2017\\train'
    #   'F:\\4k6k\\datasets\\ns_images\\imagesets\\imageset_1024_square_with_new'
    #   'F:\\4k6k\\datasets\\ns_images\\imagesets\\1024_test'
    image_roots = ['F:\\4k6k\\datasets\\ns_images\\imagesets\\imageset_256_full']
    raw_opt = {
        'name': 'amalgam',
        'paths': image_roots,
        'weights': [1],
        'target_size': target_size,
        'force_multiple': 32,
        'scale': 1,
    }
    image_dataset = ImageFolderDataset(dict_to_nonedict(raw_opt))
    loader = DataLoader(
        image_dataset,
        batch_size=batch_size,
        num_workers=num_workers,
        shuffle=True,
    )
    return loader


def produce_latent_dict(model, basename):
    """Sample latents produced by `model` over the image folder and save them.

    Every batch from `get_image_folder_dataloader` is pushed through `model`,
    the output is flattened to one row per (image, y, x) position, and up to
    100 rows are drawn uniformly at random (without replacement) from the
    whole batch. The accumulated `(latents, paths)` tuple is written to
    ``../{basename}_latent_dict.pth`` each time more than 5000 images have been
    processed since the previous save, and once more after the last batch.

    Note that `paths` collects every image path seen while `latents` holds only
    the sampled rows, so the two lists are not index-aligned.

    Args:
        model: Callable applied to the ``'hq'`` batch on CUDA; its output is
            unpacked as a 4-D ``(b, c, h, w)`` tensor.
        basename: Prefix of the output file name.
    """
    batch_size = 64
    num_workers = 4
    samples_per_batch = 100
    save_interval = 5000
    save_path = f'../{basename}_latent_dict.pth'
    dataloader = get_image_folder_dataloader(batch_size, num_workers)
    seen_since_save = 0
    paths = []
    latents = []
    prob = None
    for batch in tqdm(dataloader):
        hq = batch['hq'].to('cuda')
        l = model(hq)
        b, c, h, w = l.shape
        dim = b*h*w
        l = l.permute(0,2,3,1).reshape(dim, c).cpu()
        # Uniform sampling weights over this batch's rows. They are rebuilt
        # whenever the row count changes (e.g. a smaller final batch) so the
        # drawn indices can never run past the end of `l`.
        if prob is None or prob.shape[0] != dim:
            prob = torch.full((dim,), 1/dim)
        # Never ask for more rows than exist; multinomial without replacement
        # rejects num_samples > number of categories.
        picked = prob.multinomial(num_samples=min(samples_per_batch, dim), replacement=False)
        latents.extend(l[picked].split(1, dim=0))
        paths.extend(batch['HQ_path'])
        seen_since_save += b
        if seen_since_save > save_interval:
            print("Saving checkpoint..")
            torch.save((latents, paths), save_path)
            seen_since_save = 0
    # Flush whatever was gathered after the last periodic checkpoint; without
    # this the tail of the dataset (or all of a small dataset) is never saved.
    if seen_since_save > 0:
        print("Saving checkpoint..")
        torch.save((latents, paths), save_path)


def build_kmeans(basename):
    """Cluster the saved latents into 8 groups and store the result.

    Loads the `(latents, paths)` tuple from ``../{basename}_latent_dict.pth``,
    shuffles the latent list in place, concatenates it along dim 0 on CUDA and
    runs `kmeans` on it. The returned `(cluster_ids_x, cluster_centers)` pair is
    saved to ``../{basename}_k_means_centroids.pth``.
    """
    latent_file = f'../{basename}_latent_dict.pth'
    centroid_file = f'../{basename}_k_means_centroids.pth'

    latent_rows, _paths = torch.load(latent_file)
    shuffle(latent_rows)
    stacked = torch.cat(latent_rows, dim=0).to('cuda')

    # num_clusters matches the 8-entry colormap built in use_kmeans.
    cluster_ids_x, cluster_centers = kmeans(
        stacked,
        num_clusters=8,
        distance="euclidean",
        device=torch.device('cuda:0'),
        tol=0,
        iter_limit=5000,
        gravity_limit_per_iter=1000,
    )
    torch.save((cluster_ids_x, cluster_centers), centroid_file)


def use_kmeans(basename, model=None):
    """Render per-position k-means cluster assignments as colour images.

    Loads the centroids from ``../{basename}_k_means_centroids.pth``, runs
    `model` over batches from `get_image_folder_dataloader`, assigns every
    output position to a centroid with `kmeans_predict`, maps the assignment
    through an 8-entry viridis colormap and writes, per batch index ``i``,
    ``{i}_categories.png`` and ``{i}_hq.png`` into
    ``../results/{basename}_kmeans_viz``.

    Args:
        basename: Prefix used for the centroid file and the output directory.
        model: Callable applied to the ``'hq'`` batch on CUDA; its output is
            unpacked as a 4-D ``(b, c, h, w)`` tensor. When omitted, the
            module-level ``model`` global is used, which is how this function
            has been called from the ``__main__`` block.

    Raises:
        NameError: If `model` is omitted and no module-level ``model`` exists.
    """
    if model is None:
        # Backward compatibility: earlier versions read the global directly.
        try:
            model = globals()['model']
        except KeyError:
            raise NameError(
                "use_kmeans() needs a model: pass model=... or define a module-level 'model'"
            ) from None

    output_path = f'../results/{basename}_kmeans_viz'
    _, centers = torch.load(f'../{basename}_k_means_centroids.pth')
    centers = centers.to('cuda')
    batch_size = 8
    num_workers = 0
    dataloader = get_image_folder_dataloader(batch_size, num_workers, target_size=256)
    # NOTE(review): cm.get_cmap is reported as deprecated in newer matplotlib
    # releases -- confirm against the matplotlib version this project pins.
    colormap = cm.get_cmap('viridis', 8)
    os.makedirs(output_path, exist_ok=True)
    for i, batch in enumerate(tqdm(dataloader)):
        hq = batch['hq'].to('cuda')
        l = model(hq)
        b, c, h, w = l.shape
        # One row per (image, y, x) position, channels last.
        l = l.permute(0,2,3,1).reshape(b*h*w, c)
        pred = kmeans_predict(l, centers).reshape(b, h, w)
        # The colormap call appends a trailing colour axis, giving (b, h, w, 4)
        # -- presumably RGBA; it is moved to dim 1 below for save_image.
        img = torch.tensor(colormap(pred.detach().cpu().numpy()))
        # Resize to the exact input resolution rather than by a single
        # height-derived scale factor, so the width is right even if the
        # height and width ratios differ.
        categories = torch.nn.functional.interpolate(img.permute(0,3,1,2), size=hq.shape[-2:], mode="nearest")
        torchvision.utils.save_image(categories, f"{output_path}/{i}_categories.png")
        torchvision.utils.save_image(hq, f"{output_path}/{i}_hq.png")


if __name__ == '__main__':
    # Script entry point: build the network, load the target-encoder weights
    # from the training checkpoint, then run one of the playground steps.
    pretrained_path = '../experiments/uresnet_pixpro4_imgset.pth'
    basename = 'uresnet_pixpro4'
    model = UResNet50_3(Bottleneck, [3,4,6,3], out_dim=64).to('cuda')

    # Keep only the checkpoint entries whose key contains the target-encoder
    # prefix, and strip that prefix so the keys match the bare network.
    encoder_prefix = 'target_encoder.net.'
    resnet_sd = {
        key.replace(encoder_prefix, ''): value
        for key, value in torch.load(pretrained_path).items()
        if encoder_prefix in key
    }
    model.load_state_dict(resnet_sd, strict=True)
    model.eval()

    # Un-comment the step to run.
    with torch.no_grad():
        #find_similar_latents(model, 0, 8, structural_euc_dist)
        #create_latent_database(model, batch_size=32)
        #produce_latent_dict(model, basename)
        #build_kmeans(basename)
        use_kmeans(basename)
Move byol scripts around 2021-01-06 21:52:17 +00:00			`import os`
			`import shutil`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`from random import shuffle`
Move byol scripts around 2021-01-06 21:52:17 +00:00
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`import matplotlib.cm as cm`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`import torch`
			`import torch.nn as nn`
			`import torch.nn.functional as F`
			`import torchvision`
			`from PIL import Image`
			`from torch.utils.data import DataLoader`
			`from torchvision.models.resnet import Bottleneck`
			`from torchvision.transforms import ToTensor, Resize`
			`from tqdm import tqdm`
			`import numpy as np`

			`import utils`
			`from data.image_folder_dataset import ImageFolderDataset`
			`from models.pixel_level_contrastive_learning.resnet_unet import UResNet50`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`from models.pixel_level_contrastive_learning.resnet_unet_2 import UResNet50_2`
			`from models.pixel_level_contrastive_learning.resnet_unet_3 import UResNet50_3`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`from models.resnet_with_checkpointing import resnet50`
			`from models.spinenet_arch import SpineNet`


			`# Computes the structural euclidean distance between [x,y]. "Structural" here means the [h,w] dimensions are preserved`
			`# and the distance is computed across the channel dimension.`
			`from scripts.byol.byol_spinenet_playground import find_similar_latents, create_latent_database`
			`from utils import util`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`from utils.kmeans import kmeans, kmeans_predict`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`from utils.options import dict_to_nonedict`


			`def structural_euc_dist(x, y):`
			`diff = torch.square(x - y)`
			`sum = torch.sum(diff, dim=-1)`
			`return torch.sqrt(sum)`


			`def cosine_similarity(x, y):`
			`x = norm(x)`
			`y = norm(y)`
			`return -nn.CosineSimilarity()(x, y) # probably better to just use this class to perform the calc. Just left this here to remind myself.`


			`def key_value_difference(x, y):`
			`x = F.normalize(x, dim=-1, p=2)`
			`y = F.normalize(y, dim=-1, p=2)`
			`return 2 - 2 * (x * y).sum(dim=-1)`


			`def norm(x):`
			`sh = x.shape`
			`sh_r = tuple([sh[i] if i != len(sh)-1 else 1 for i in range(len(sh))])`
			`return (x - torch.mean(x, dim=-1).reshape(sh_r)) / torch.std(x, dim=-1).reshape(sh_r)`


			`def im_norm(x):`
			`return (((x - torch.mean(x, dim=(2,3)).reshape(-1,1,1,1)) / torch.std(x, dim=(2,3)).reshape(-1,1,1,1)) * .5) + .5`


Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`def get_image_folder_dataloader(batch_size, num_workers, target_size=256):`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`dataset_opt = dict_to_nonedict({`
			`'name': 'amalgam',`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`#'paths': ['F:\\4k6k\\datasets\\images\\imagenet_2017\\train'],`
Support training imagenet classifier 2021-01-12 03:09:16 +00:00			`#'paths': ['F:\\4k6k\\datasets\\ns_images\\imagesets\\imageset_1024_square_with_new'],`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`'paths': ['F:\\4k6k\\datasets\\ns_images\\imagesets\\imageset_256_full'],`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`#'paths': ['F:\\4k6k\\datasets\\ns_images\\imagesets\\1024_test'],`
			`'weights': [1],`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`'target_size': target_size,`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`'force_multiple': 32,`
			`'scale': 1`
			`})`
			`dataset = ImageFolderDataset(dataset_opt)`
			`return DataLoader(dataset, batch_size=batch_size, num_workers=num_workers, shuffle=True)`


test uresnet playground mods 2021-01-23 20:46:43 +00:00			`def produce_latent_dict(model, basename):`
			`batch_size = 64`
BYOL script updates 2021-01-07 23:31:28 +00:00			`num_workers = 4`
			`dataloader = get_image_folder_dataloader(batch_size, num_workers)`
			`id = 0`
			`paths = []`
			`latents = []`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`prob = None`
BYOL script updates 2021-01-07 23:31:28 +00:00			`for batch in tqdm(dataloader):`
			`hq = batch['hq'].to('cuda')`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`l = model(hq)`
			`b, c, h, w = l.shape`
			`dim = b*h*w`
			`l = l.permute(0,2,3,1).reshape(dim, c).cpu()`
			`# extract a random set of 10 latents from each image`
			`if prob is None:`
			`prob = torch.full((dim,), 1/(dim))`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`l = l[prob.multinomial(num_samples=100, replacement=False)].split(1, dim=0)`
BYOL script updates 2021-01-07 23:31:28 +00:00			`latents.extend(l)`
			`paths.extend(batch['HQ_path'])`
			`id += batch_size`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`if id > 5000:`
BYOL script updates 2021-01-07 23:31:28 +00:00			`print("Saving checkpoint..")`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`torch.save((latents, paths), f'../{basename}_latent_dict.pth')`
BYOL script updates 2021-01-07 23:31:28 +00:00			`id = 0`


test uresnet playground mods 2021-01-23 20:46:43 +00:00			`def build_kmeans(basename):`
			`latents, _ = torch.load(f'../{basename}_latent_dict.pth')`
			`shuffle(latents)`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`latents = torch.cat(latents, dim=0).to('cuda')`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`cluster_ids_x, cluster_centers = kmeans(latents, num_clusters=8, distance="euclidean", device=torch.device('cuda:0'), tol=0, iter_limit=5000, gravity_limit_per_iter=1000)`
			`torch.save((cluster_ids_x, cluster_centers), f'../{basename}_k_means_centroids.pth')`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00

test uresnet playground mods 2021-01-23 20:46:43 +00:00			`def use_kmeans(basename):`
			`output_path = f'../results/{basename}_kmeans_viz'`
			`_, centers = torch.load(f'../{basename}_k_means_centroids.pth')`
Support training imagenet classifier 2021-01-12 03:09:16 +00:00			`centers = centers.to('cuda')`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`batch_size = 8`
			`num_workers = 0`
Support training imagenet classifier 2021-01-12 03:09:16 +00:00			`dataloader = get_image_folder_dataloader(batch_size, num_workers, target_size=256)`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`colormap = cm.get_cmap('viridis', 8)`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`os.makedirs(output_path, exist_ok=True)`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`for i, batch in enumerate(tqdm(dataloader)):`
			`hq = batch['hq'].to('cuda')`
			`l = model(hq)`
			`b, c, h, w = l.shape`
			`dim = b*h*w`
			`l = l.permute(0,2,3,1).reshape(dim,c)`
Support training imagenet classifier 2021-01-12 03:09:16 +00:00			`pred = kmeans_predict(l, centers)`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00			`pred = pred.reshape(b,h,w)`
Support training imagenet classifier 2021-01-12 03:09:16 +00:00			`img = torch.tensor(colormap(pred[:, :, :].detach().cpu().numpy()))`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`scale = hq.shape[-2] / h`
			`torchvision.utils.save_image(torch.nn.functional.interpolate(img.permute(0,3,1,2), scale_factor=scale, mode="nearest"),`
			`f"{output_path}/{i}_categories.png")`
			`torchvision.utils.save_image(hq, f"{output_path}/{i}_hq.png")`
Did anyone ask for k-means clustering? This is so cool... 2021-01-08 05:37:41 +00:00

Move byol scripts around 2021-01-06 21:52:17 +00:00			`if __name__ == '__main__':`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`pretrained_path = '../experiments/uresnet_pixpro4_imgset.pth'`
			`basename = 'uresnet_pixpro4'`
			`model = UResNet50_3(Bottleneck, [3,4,6,3], out_dim=64).to('cuda')`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`sd = torch.load(pretrained_path)`
			`resnet_sd = {}`
			`for k, v in sd.items():`
			`if 'target_encoder.net.' in k:`
			`resnet_sd[k.replace('target_encoder.net.', '')] = v`
			`model.load_state_dict(resnet_sd, strict=True)`
			`model.eval()`

			`with torch.no_grad():`
BYOL script updates 2021-01-07 23:31:28 +00:00			`#find_similar_latents(model, 0, 8, structural_euc_dist)`
Move byol scripts around 2021-01-06 21:52:17 +00:00			`#create_latent_database(model, batch_size=32)`
test uresnet playground mods 2021-01-23 20:46:43 +00:00			`#produce_latent_dict(model, basename)`
			`#uild_kmeans(basename)`
			`use_kmeans(basename)`