From a3b7260514bab2c0352c191937bf3758cce4f94d Mon Sep 17 00:00:00 2001 From: mrq Date: Thu, 13 Feb 2025 16:11:39 -0600 Subject: [PATCH] ugh --- vall_e/models/base.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/vall_e/models/base.py b/vall_e/models/base.py index b4fb2ae..acc70e8 100755 --- a/vall_e/models/base.py +++ b/vall_e/models/base.py @@ -735,8 +735,8 @@ class Base(nn.Module): if self.version >= 6: self.raw_text_emb = Embedding(self.n_raw_text_tokens, d_model) - self.resp_parallel_training = True # - self.monolithic_audio_encoder = True # + self.resp_parallel_training = True # governs if all levels are trained in parallel or one per sample like the old way + self.monolithic_audio_encoder = False # monolithic sounds bad if self.version >= 7: pd_model = d_model // 4 pd_ffn = pd_model * 4