diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-07-22 00:23:11 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-07-22 00:23:11 +0200 |
commit | b8158c02900b64f9356e05a2548e15f85f4545f4 (patch) | |
tree | b81f74d974b84a26d77c7de1dd9b80187bec5947 /training/conf/network/conv_transformer.yaml | |
parent | 9cfd991576cbbc9d005feba93a2a8c9d8f58cb52 (diff) |
Update conv transformer conf
Diffstat (limited to 'training/conf/network/conv_transformer.yaml')
-rw-r--r-- | training/conf/network/conv_transformer.yaml | 6 |
1 files changed, 3 insertions, 3 deletions
```diff
diff --git a/training/conf/network/conv_transformer.yaml b/training/conf/network/conv_transformer.yaml
index 24857c8..c4cf13e 100644
--- a/training/conf/network/conv_transformer.yaml
+++ b/training/conf/network/conv_transformer.yaml
@@ -1,6 +1,6 @@
 _target_: text_recognizer.networks.ConvTransformer
 input_dims: [1, 1, 576, 640]
-hidden_dim: &hidden_dim 144
+hidden_dim: &hidden_dim 96
 num_classes: 58
 pad_index: 3
 encoder:
@@ -19,9 +19,9 @@ decoder:
     self_attn:
       _target_: text_recognizer.networks.transformer.Attention
       dim: *hidden_dim
-      num_heads: 8
+      num_heads: 12
       dim_head: 64
-      dropout_rate: &dropout_rate 0.4
+      dropout_rate: &dropout_rate 0.2
       causal: true
       rotary_embedding:
         _target_: text_recognizer.networks.transformer.RotaryEmbedding
```