diff options
author | John Bauer <horatio@gmail.com> | 2022-11-03 04:37:43 +0300 |
---|---|---|
committer | John Bauer <horatio@gmail.com> | 2022-11-03 04:37:43 +0300 |
commit | 9ca3186386b17e7505fe79c519ed676815bd0ffe (patch) | |
tree | 24741633eb78d74dd150f8bcc91fc180bd3e6dee | |
parent | 41a23f2c892a3903dab945f4e04fb55b0d0c8862 (diff) |
more heads? should run some experiments (pattn_issue)
-rw-r--r-- | stanza/models/constituency/lstm_model.py | 2 |
1 file changed, 1 insertion, 1 deletion
diff --git a/stanza/models/constituency/lstm_model.py b/stanza/models/constituency/lstm_model.py
index a7d354fe..4bf45d21 100644
--- a/stanza/models/constituency/lstm_model.py
+++ b/stanza/models/constituency/lstm_model.py
@@ -344,7 +344,7 @@ class LSTMModel(BaseModel, nn.Module):
 self.word_transform_size = self.hidden_size * 2
-encoder_layers = TransformerEncoderLayer(self.hidden_size * 2, 2, self.hidden_size * 2, 0.1, batch_first=True)
+encoder_layers = TransformerEncoderLayer(self.hidden_size * 2, 8, self.hidden_size * 2, 0.1, batch_first=True)
 self.transformer_encoder = TransformerEncoder(encoder_layers, 1)
 self.partitioned_transformer_module = None