Merge pull request #46 from sunyt32/retnet-official
Update epsilon in retention
This commit is contained in:
commit
7d231743f4
|
@@ -67,7 +67,7 @@ class MultiScaleRetention(nn.Module):
|
|||
|
||||
self.out_proj = MultiwayWrapper(args, nn.Linear(embed_dim * self.factor, embed_dim, bias=True))
|
||||
|
||||
- self.group_norm = MultiwayWrapper(args, LayerNorm(self.head_dim, eps=args.layernorm_eps, elementwise_affine=False))
|
||||
+ self.group_norm = MultiwayWrapper(args, LayerNorm(self.head_dim, eps=1e-6, elementwise_affine=False))
|
||||
self.reset_parameters()
|
||||
|
||||
def reset_parameters(self):
|
||||
|
|
Loading…
Reference in New Issue
Block a user