diff --git a/vall_e/models/base.py b/vall_e/models/base.py index b4fb2ae..acc70e8 100755 --- a/vall_e/models/base.py +++ b/vall_e/models/base.py @@ -735,8 +735,8 @@ class Base(nn.Module): if self.version >= 6: self.raw_text_emb = Embedding(self.n_raw_text_tokens, d_model) - self.resp_parallel_training = True # - self.monolithic_audio_encoder = True # + self.resp_parallel_training = True # governs whether all levels are trained in parallel or one per sample (the old way) + self.monolithic_audio_encoder = False # disabled: the monolithic audio encoder sounds bad if self.version >= 7: pd_model = d_model // 4 pd_ffn = pd_model * 4