This commit is contained in:
mrq 2024-11-18 14:12:26 -06:00
parent 4a71981456
commit 2b29790173
2 changed files with 3 additions and 0 deletions

View File

@@ -714,6 +714,7 @@ class Dataset(_Dataset):
for key in keys:
if len(self.paths_by_spkr_name[key]) < cfg.dataset.min_utterances:
del self.paths_by_spkr_name[key]
continue
# slice away extraneous utterances
if cfg.dataset.max_utterances:

View File

@@ -263,6 +263,8 @@ class AR_NAR(Base):
null_prom = [ None for _ in range(batch_size) ]
prev_list = resps_list
# to-do: only do the first N tokens, then the second N tokens, etc. until the last window
# because for longer utterances it absolutely degrades
for timestep in tqdm(torch.linspace(start_noise, end_noise, max_steps), desc="NAR Masked", disable=disable_tqdm):
# ramp down over time
annealing = 1.0 - timestep