From 9c7598dc9a8bebdb859fd58edb518e1b9dd58e10 Mon Sep 17 00:00:00 2001 From: James Betker Date: Mon, 21 Mar 2022 15:29:17 -0600 Subject: [PATCH] fix conditioning_free signal --- codes/models/audio/tts/unet_diffusion_tts_flat.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/codes/models/audio/tts/unet_diffusion_tts_flat.py b/codes/models/audio/tts/unet_diffusion_tts_flat.py index 714f5a03..699585e0 100644 --- a/codes/models/audio/tts/unet_diffusion_tts_flat.py +++ b/codes/models/audio/tts/unet_diffusion_tts_flat.py @@ -158,7 +158,7 @@ class DiffusionTtsFlat(nn.Module): # Note: this block does not need to repeated on inference, since it is not timestep-dependent or x-dependent. unused_params = [] if conditioning_free: - code_emb = self.unconditioned_embedding.repeat(x.shape[0], 1, 1) + code_emb = self.unconditioned_embedding.repeat(conditioning_input.shape[0], 1, 1) else: unused_params.append(self.unconditioned_embedding) cond_emb = self.contextual_embedder(conditioning_input)