forked from mrq/DL-Art-School
fix booboo
parent cc62ba9cba
commit 45afefabed
@@ -273,7 +273,7 @@ class TransformerDiffusion(nn.Module):
         return groups
 
     def before_step(self, step):
-        scaled_grad_parameters = list(itertools.chain.from_iterable([lyr.out.parameters() for lyr in self.diff.layers]))
+        scaled_grad_parameters = list(itertools.chain.from_iterable([lyr.out.parameters() for lyr in self.layers]))
         # Scale back the gradients of the blkout and prenorm layers by a constant factor. These get two orders of magnitudes
         # higher gradients. Ideally we would use parameter groups, but ZeroRedundancyOptimizer makes this trickier than
         # directly fiddling with the gradients.
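The hunk cuts off before the scaling itself, so as a rough, self-contained sketch of the pattern the comments describe: gather the out-projection parameters of every layer and shrink their gradients in place between backward() and the optimizer step. The TinyLayer/TinyModel classes and the 0.01 factor below are illustrative assumptions, not code from this repository.

import itertools

import torch
import torch.nn as nn


class TinyLayer(nn.Module):
    # Stand-in for a transformer block; "out" plays the role of the
    # blkout/prenorm projections whose gradients run hot.
    def __init__(self, dim):
        super().__init__()
        self.ff = nn.Linear(dim, dim)
        self.out = nn.Linear(dim, dim)

    def forward(self, x):
        return self.out(torch.relu(self.ff(x)))


class TinyModel(nn.Module):
    def __init__(self, dim=16, n_layers=3):
        super().__init__()
        self.layers = nn.ModuleList(TinyLayer(dim) for _ in range(n_layers))

    def forward(self, x):
        for lyr in self.layers:
            x = lyr(x)
        return x

    def before_step(self, step):
        # Collect the parameters of every layer's output projection,
        # mirroring the line changed in this commit.
        scaled_grad_parameters = list(itertools.chain.from_iterable(
            [lyr.out.parameters() for lyr in self.layers]))
        # Scale their gradients down in place by an assumed constant factor
        # (0.01 here for illustration; the real factor may differ), instead of
        # using optimizer parameter groups.
        for p in scaled_grad_parameters:
            if p.grad is not None:
                p.grad.data.mul_(0.01)


# Usage: call before_step() after backward() and before optimizer.step().
model = TinyModel()
x = torch.randn(4, 16)
loss = model(x).pow(2).mean()
loss.backward()
model.before_step(step=0)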