My DAC dataset once again ended up with some utterances that have only 8 of the 9 RVQ levels; this fixes an oversight that exposed.

2024-08-09 21:18:01 -05:00 · 2024-08-09 21:18:01 -05:00 · 054d28573a
commit 054d28573a
parent 2a1794c084
1 changed files with 1 additions and 1 deletions
--- a/vall_e/emb/qnt.py
+++ b/vall_e/emb/qnt.py
@@ -682,7 +682,7 @@ def pad_codes_with_silence( codes, size=1 ):
 	duration = codes.shape[0] * get_framerate()
 	difference = math.ceil( duration + size ) - duration

-	silence = get_silence( difference, device=codes.device )
+	silence = get_silence( difference, device=codes.device )[:, :codes.shape[-1]]

 	half = math.floor(difference / 2 * get_framerate())