From 28a674e0f16ee0521f3126e687324bb7dbc0cbcd Mon Sep 17 00:00:00 2001 From: mrq Date: Thu, 18 Jul 2024 23:25:32 -0500 Subject: [PATCH] fixes... --- vall_e/data.py | 103 +++++++++++++++++++++++++----------------- vall_e/emb/qnt.py | 19 ++++++-- vall_e/models/base.py | 34 +++++++++++--- 3 files changed, 105 insertions(+), 51 deletions(-) diff --git a/vall_e/data.py b/vall_e/data.py index d9d5c2a..34b0f22 100755 --- a/vall_e/data.py +++ b/vall_e/data.py @@ -275,6 +275,9 @@ def get_task_symmap(): "": 5, "": 6, "": 7, + + "": 6, # fake + "": 6, # fake } def _replace_file_extension(path, suffix): @@ -849,12 +852,12 @@ class Dataset(_Dataset): if f'<{task}>' not in self.task_symmap: raise Exception(f'Task not defined: {task}') - # Base TTS (text + prompt => output) + # Base TTS ( => ) if task == "tts": - proms = self.sample_prompts(spkr_name, ignore=path) if random.random() < cfg.dataset.random_utterance else resps + proms = self.sample_prompts(spkr_name, ignore=path) - # VALL-E Continuous (text + partial output => rest of output) - # (this could just be sampled as +