add top_k sampling / offset for prompt similar utterance sampling
This commit is contained in:
parent
9da630f73a
commit
f24547ad4e
|
@ -158,6 +158,8 @@ class Dataset:
|
|||
max_resps: int = 1 # number of samples to target for training
|
||||
p_resp_append: float = 1.0 # probability to append another sample to the training target
|
||||
p_resp_pad_silence: float = 0.0 # probability to pad resp with silence to fit within the next window
|
||||
prompt_similar_top_k: int = 1
|
||||
prompt_similar_top_k_offset: int = 0
|
||||
|
||||
sample_type: str = "path" # path | speaker
|
||||
sample_order: str = "interleaved" # duration
|
||||
|
|
|
@ -880,7 +880,10 @@ class Dataset(_Dataset):
|
|||
return path, text, resps
|
||||
|
||||
# icky slop
|
||||
def get_similar_utterance(self, path, offset=0 ):
|
||||
def get_similar_utterance(self, path, offset=None ):
|
||||
if offset is None:
|
||||
offset = cfg.dataset.prompt_similar_top_k_offset
|
||||
|
||||
reference = path.name
|
||||
|
||||
if cfg.dataset.use_hdf5:
|
||||
|
@ -904,6 +907,11 @@ class Dataset(_Dataset):
|
|||
offset = 0
|
||||
|
||||
metadata_keys = list(metadata.keys())
|
||||
|
||||
if cfg.dataset.prompt_similar_top_k > 1:
|
||||
indices = reference_metadata["similar"][offset:offset+cfg.dataset.prompt_similar_top_k]
|
||||
index = random.choice( indices )
|
||||
else:
|
||||
index = reference_metadata["similar"][offset]
|
||||
name = metadata_keys[index]
|
||||
|
||||
|
|
Loading…
Reference in New Issue
Block a user