diff --git a/vall_e/emb/similar.py b/vall_e/emb/similar.py index 3992dae..8936094 100644 --- a/vall_e/emb/similar.py +++ b/vall_e/emb/similar.py @@ -195,7 +195,7 @@ def process( sorted_similarities = {} - for index, filename in tqdm(enumerate(keys), total=len(keys), desc=f"Computing similarities: {speaker_path.name}"): + for index, filename in tqdm(enumerate(keys), total=len(keys), desc=f"Computing similarities: {speaker_path.name}", disable=not verbose): if features[filename] is None: continue @@ -241,7 +241,7 @@ def main(): args = parser.parse_args() - args.skip_existing = False # + args.skip_existing = True # if args.use_dataset: cfg.metadata_dir.mkdir(parents=True, exist_ok=True) @@ -278,7 +278,7 @@ def main(): dtype=args.dtype, amp=args.amp, - verbose=True, + verbose=False, ) if not similarities: diff --git a/vall_e/engines/__init__.py b/vall_e/engines/__init__.py index ffe51ad..0feec2e 100755 --- a/vall_e/engines/__init__.py +++ b/vall_e/engines/__init__.py @@ -188,6 +188,7 @@ def load_engines(training=True, **model_kwargs): keys = [ ("text_emb.weight", model.config.text_tokens ), ("tasks_emb.weight", model.config.tasks ), + ("langs_emb.weight", model.config.langs ), ("rvq_l_emb.weight", model.config.resp_levels + (1 if "len" in model.config.capabilities else 0) ), ("resps_emb.embeddings.0.weight", model.config.audio_tokens + uses_stop_token ), ("model.embed_tokens.weight", model.config.audio_tokens + uses_stop_token ),