My DAC dataset once again ended up with some utterances that have only 8 of the 9 RVQ levels; this fixes an oversight stemming from that.

This commit is contained in:
mrq 2024-08-09 21:18:01 -05:00
parent 2a1794c084
commit 054d28573a

View File

@@ -682,7 +682,7 @@ def pad_codes_with_silence( codes, size=1 ):
duration = codes.shape[0] * get_framerate()
difference = math.ceil( duration + size ) - duration
silence = get_silence( difference, device=codes.device )
silence = get_silence( difference, device=codes.device )[:, :codes.shape[-1]]
half = math.floor(difference / 2 * get_framerate())