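Tweaked tts-continuous task: demote "tts-c" to "tts" when the target is too short, instead of tracking a separate `continuous` flag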
This commit is contained in:
parent
21e5d250cc
commit
71e68a8528
|
@ -314,12 +314,14 @@ class Dataset(_Dataset):
|
||||||
# text-to-speech
|
# text-to-speech
|
||||||
if task == "tts" or task == "tts-c":
|
if task == "tts" or task == "tts-c":
|
||||||
trim_length = int(cfg.dataset.prompt_duration * 75)
|
trim_length = int(cfg.dataset.prompt_duration * 75)
|
||||||
continuous = task == "tts-c" and trim_length * 2 < resps.shape[0]
|
# demote "tts-c" to plain "tts" if the target is not longer than twice the prompt trim length
|
||||||
|
if task == "tts-c" and trim_length * 2 >= resps.shape[0]:
|
||||||
|
task = "tts"
|
||||||
|
|
||||||
# VALL-E continuous
|
# VALL-E continuous
|
||||||
# ignore if target utterance is shorter than prompt duration
|
# ignore if target utterance is shorter than prompt duration
|
||||||
# to-do: actually do this for the AR only as I don't think the paper trained the NAR for this
|
# to-do: actually do this for the AR only as I don't think the paper trained the NAR for this
|
||||||
if continuous:
|
if task == "tts-c":
|
||||||
proms = resps[:trim_length, :]
|
proms = resps[:trim_length, :]
|
||||||
resps = resps[trim_length:, :]
|
resps = resps[trim_length:, :]
|
||||||
else:
|
else:
|
||||||
|
|
Loading…
Reference in New Issue
Block a user