diff --git a/codes/scripts/audio/gen/speech_synthesis_utils.py b/codes/scripts/audio/gen/speech_synthesis_utils.py index d065efb9..4902db19 100644 --- a/codes/scripts/audio/gen/speech_synthesis_utils.py +++ b/codes/scripts/audio/gen/speech_synthesis_utils.py @@ -22,7 +22,7 @@ def load_speech_dvae(): def load_univnet_vocoder(): model = UnivNetGenerator() - sd = torch.load('../experiments/univnet_c32_pretrained_libri.pt') + sd = torch.load('../experiments/univnet_c32_pretrained_libri.pt', map_location='cpu') model.load_state_dict(sd['model_g']) model = model.cpu() model.eval(inference=True)