fix call to activation_fn

Kashif Rasul 2022-11-29 00:11:38 +01:00
parent be14bc23a1
commit c69aba2a73


@@ -391,7 +391,7 @@ class ClassificationHead(nn.Module):
         x = features[:, 0, :]  # take <s> token (equiv. to [CLS])
         x = self.dropout(x)
         x = self.dense(x)
-        x = self.activation_fn(x)
+        x = self.activation_fn(x.float()).type_as(x)
         x = self.dropout(x)
         x = self.out_proj(x)
         return x
@@ -418,7 +418,7 @@ class LMHead(nn.Module):
             features = features[masked_tokens, :]
         x = self.dense(features)
-        x = self.activation_fn(x)
+        x = self.activation_fn(x.float()).type_as(x)
         x = self.layer_norm(x)
         # project back to size of vocabulary with bias
         x = F.linear(x, self.weight) + self.bias
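
For context, the corrected call follows a common mixed-precision pattern: the activation is evaluated in float32 and the result is cast back to the input's dtype with Tensor.type_as, avoiding fp16 overflow and precision loss inside the nonlinearity. A minimal runnable sketch of the pattern, assuming fp16 inputs and using GELU as a hypothetical stand-in for the configurable activation_fn in these head modules:

import torch
import torch.nn as nn

# Sketch of the pattern in this commit, under the assumption that the model
# runs in fp16: compute the activation in float32 for numerical stability,
# then cast the result back to the input dtype. nn.GELU is a stand-in here;
# the actual activation_fn is configured elsewhere.
activation_fn = nn.GELU()

x = torch.randn(4, 768, dtype=torch.float16)
y = activation_fn(x.float()).type_as(x)  # activation in fp32, output in fp16
assert y.dtype == x.dtype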