From 3ea8a610d66c1830a2f0955ce83406142e40d608 Mon Sep 17 00:00:00 2001 From: mrq Date: Wed, 13 Nov 2024 14:27:15 -0600 Subject: [PATCH] fix STT --- vall_e/models/base.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/vall_e/models/base.py b/vall_e/models/base.py index a76d64f..f9f495b 100755 --- a/vall_e/models/base.py +++ b/vall_e/models/base.py @@ -1174,9 +1174,9 @@ class Base(nn.Module): # we do a manual sum because I trained it to use the AR embeddings + NAR embeddings for STT...... embedding = sum([ self.resps_emb( input[:, :l+1], - #offset = 0 if l == 0 else 1, # or maybe set to 1 - #quant_level = l, - name = 'AR:0:0' if l == 0 else f'NAR:{l-1}:{l}', + offset = 0 if l == 0 else 1, # or maybe set to 1 + quant_level = l, + #name = 'AR:0:0' if l == 0 else f'NAR:{l-1}:{l}', sums = False ) for l in range( input.shape[-1] - 1 ) ]) else: