Merge pull request #46 from sunyt32/retnet-official

Update epsilon in retention
This commit is contained in:
Shuming Ma 2023-08-02 14:07:44 +08:00 committed by GitHub
commit 7d231743f4
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -67,7 +67,7 @@ class MultiScaleRetention(nn.Module):
self.out_proj = MultiwayWrapper(args, nn.Linear(embed_dim * self.factor, embed_dim, bias=True))
- self.group_norm = MultiwayWrapper(args, LayerNorm(self.head_dim, eps=args.layernorm_eps, elementwise_affine=False))
+ self.group_norm = MultiwayWrapper(args, LayerNorm(self.head_dim, eps=1e-6, elementwise_affine=False))
self.reset_parameters()
def reset_parameters(self):