From bee2688deae12863d71f1ff098afb9434f949d8e Mon Sep 17 00:00:00 2001 From: mrq Date: Sat, 15 Mar 2025 16:50:21 -0500 Subject: [PATCH] ugh --- vall_e/data.py | 7 +++---- vall_e/train.py | 2 +- 2 files changed, 4 insertions(+), 5 deletions(-) diff --git a/vall_e/data.py b/vall_e/data.py index 92f078a..fb5bfdb 100755 --- a/vall_e/data.py +++ b/vall_e/data.py @@ -853,10 +853,9 @@ class Dataset(_Dataset): self.metadata = _load_dataset_metadata(self.dataset, self.dataset_type, dataset_hash_key=self.dataset_hash_key) # cull speakers with too little utterances - for speaker in self.metadata.keys(): - utterances = len(self.metadata[speaker]) - if utterances < cfg.dataset.min_utterances: - del self.metadata[speaker] + prune_keys = [ speaker for speaker in self.metadata.keys() if len(self.metadata[speaker]) < cfg.dataset.min_utterances ] + for speaker in prune_keys: + del self.metadata[speaker] self.paths = [] self.speakers = list(self.metadata.keys()) diff --git a/vall_e/train.py b/vall_e/train.py index 260a5e7..fd90d95 100755 --- a/vall_e/train.py +++ b/vall_e/train.py @@ -122,7 +122,7 @@ def run_eval(engines, eval_name, dl, args=None): return def process( name, batch, resps_list ): - for speaker, path, ref, hyp, prom, task in zip(batch["spkr_name"], batch["path"], batch["resps"], resps_list, batch["proms"], batch["task"]): + for speaker, path, ref, hyp, prom, task in zip(batch["speaker_name"], batch["path"], batch["resps"], resps_list, batch["proms"], batch["task"]): if len(hyp) == 0: continue