forked from mrq/tortoise-tts
Optimizing graphics card memory
During inference the model does not need to store gradients, which take up most of the video memory.
This commit is contained in:
parent
ea8c825ee0
commit
cc38333249
@@ -225,6 +225,7 @@ class TextToSpeech:
         properties.
         :param voice_samples: List of 2 or more ~10 second reference clips, which should be torch tensors containing 22.05kHz waveform data.
         """
+        with torch.no_grad():
         voice_samples = [v.to('cuda') for v in voice_samples]
 
         auto_conds = []
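As context for the change above, here is a minimal sketch (not the actual TTS model; a stand-in `torch.nn.Linear` is used for illustration) of how `torch.no_grad()` disables autograd tracking, which is why wrapping inference in it frees the activation buffers that would otherwise be kept for backpropagation:

```python
import torch

model = torch.nn.Linear(128, 128)  # hypothetical stand-in for the TTS model
x = torch.randn(4, 128)

# Outside no_grad, outputs carry grad history and intermediate
# activations are retained for a potential backward pass.
y1 = model(x)
assert y1.requires_grad

# Inside no_grad, autograd records nothing, so those buffers are
# released immediately and peak memory during inference drops.
with torch.no_grad():
    y2 = model(x)
assert not y2.requires_grad
```

On CUDA the same effect shows up as lower peak VRAM, since the saved activations are what dominate memory during a forward pass.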