Update epsilon in retention

This commit is contained in:
sunyt32 2023-08-02 05:38:30 +00:00
parent 5356b252c4
commit 2c29de0fb3

View File

@@ -67,7 +67,7 @@ class MultiScaleRetention(nn.Module):
self.out_proj = MultiwayWrapper(args, nn.Linear(embed_dim * self.factor, embed_dim, bias=True))
self.group_norm = MultiwayWrapper(args, LayerNorm(self.head_dim, eps=args.layernorm_eps, elementwise_affine=False))
self.group_norm = MultiwayWrapper(args, LayerNorm(self.head_dim, eps=1e-6, elementwise_affine=False))
self.reset_parameters()
def reset_parameters(self):