From 438dcaccc5f2524f5095fad11fb1bacb18dd7e72 Mon Sep 17 00:00:00 2001 From: James Betker Date: Sat, 16 Jul 2022 13:58:52 -0600 Subject: [PATCH] misc --- codes/trainer/eval/music_diffusion_fid.py | 6 +++--- codes/trainer/injectors/audio_injectors.py | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/codes/trainer/eval/music_diffusion_fid.py b/codes/trainer/eval/music_diffusion_fid.py index 9dfc5986..352a66c6 100644 --- a/codes/trainer/eval/music_diffusion_fid.py +++ b/codes/trainer/eval/music_diffusion_fid.py @@ -438,18 +438,18 @@ class MusicDiffusionFid(evaluator.Evaluator): if __name__ == '__main__': diffusion = load_model_from_config('X:\\dlas\\experiments\\train_music_cheater_gen.yml', 'generator', also_load_savepoint=False, - load_path='X:\\dlas\\experiments\\train_music_cheater_gen_v5_cosine_40_lyr\\models\\18500_generator_ema.pth' + load_path='X:\\dlas\\experiments\\train_music_cheater_gen_v5_cosine_40_lyr\\models\\19500_generator.pth' ).cuda() opt_eval = {'path': 'Y:\\split\\yt-music-eval', # eval music, mostly electronica. :) #'path': 'E:\\music_eval', # this is music from the training dataset, including a lot more variety. 'diffusion_steps': 128, # basis: 192 - 'conditioning_free': False, 'conditioning_free_k': 1, 'use_ddim': True, 'clip_audio': False, + 'conditioning_free': True, 'conditioning_free_k': 1, 'use_ddim': False, 'clip_audio': False, 'diffusion_schedule': 'cosine', 'diffusion_type': 'cheater_gen', # Slope 1: 1.03x, 2: 1.06, 4: 1.135, 8: 1.27, 16: 1.54 #'causal': True, 'causal_slope': 4, # DONT FORGET TO INCREMENT THE STEP! #'partial_low': 128, 'partial_high': 192 } - env = {'rank': 0, 'base_path': 'D:\\tmp\\test_eval_music', 'step': 201, 'device': 'cuda', 'opt': {}} + env = {'rank': 0, 'base_path': 'D:\\tmp\\test_eval_music', 'step': 204, 'device': 'cuda', 'opt': {}} eval = MusicDiffusionFid(diffusion, opt_eval, env) fds = [] for i in range(2): diff --git a/codes/trainer/injectors/audio_injectors.py b/codes/trainer/injectors/audio_injectors.py index fc81421e..faecf4ad 100644 --- a/codes/trainer/injectors/audio_injectors.py +++ b/codes/trainer/injectors/audio_injectors.py @@ -122,7 +122,7 @@ class RandomAudioCropInjector(Injector): else: len = inp.shape[-1] - margin = len - crop_sz - self.min_buffer + margin = len - crop_sz - self.min_buffer * 2 if margin < 0: start = self.min_buffer else: