diff --git a/codes/models/asr/w2v_wrapper.py b/codes/models/asr/w2v_wrapper.py index b5bf5737..e2ef8ddb 100644 --- a/codes/models/asr/w2v_wrapper.py +++ b/codes/models/asr/w2v_wrapper.py @@ -30,7 +30,7 @@ class Wav2VecWrapper(nn.Module): self.w2v.lm_head = nn.Linear(self.w2v.config.hidden_size, vocab_size) self.w2v.config.vocab_size = vocab_size self.w2v.config.pad_token_id = 0 - self.w2v.config.ctc_loss_reduction = 'mean' + self.w2v.config.ctc_loss_reduction = 'sum' self.w2v.config.apply_spec_augment = spec_augment # We always freeze the feature extractor, which needs some special operations in DLAS