diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-06-15 00:15:40 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-06-15 00:15:40 +0200 |
commit | 2c9066b685d41ef0ab5ea94e938b8a30b4123656 (patch) | |
tree | 341e8d0d73cdde0fe4908421a5e9fd34f16cd8c3 /training/conf/network/decoder | |
parent | 8bb76745e43c6b4967c8e91ebaf4c4295d0b8d0b (diff) |
Update configs
Diffstat (limited to 'training/conf/network/decoder')
-rw-r--r-- | training/conf/network/decoder/transformer_decoder.yaml | 30 |
1 files changed, 0 insertions, 30 deletions
```diff
diff --git a/training/conf/network/decoder/transformer_decoder.yaml b/training/conf/network/decoder/transformer_decoder.yaml
deleted file mode 100644
index 4588ee9..0000000
--- a/training/conf/network/decoder/transformer_decoder.yaml
+++ /dev/null
@@ -1,30 +0,0 @@
-_target_: text_recognizer.networks.transformer.decoder.Decoder
-depth: 4
-block:
-  _target_: text_recognizer.networks.transformer.decoder.DecoderBlock
-  self_attn:
-    _target_: text_recognizer.networks.transformer.attention.Attention
-    dim: 64
-    num_heads: 4
-    dim_head: 64
-    dropout_rate: 0.05
-    causal: true
-    rotary_embedding:
-      _target_: text_recognizer.networks.transformer.embeddings.rotary.RotaryEmbedding
-      dim: 128
-  cross_attn:
-    _target_: text_recognizer.networks.transformer.attention.Attention
-    dim: 64
-    num_heads: 4
-    dim_head: 64
-    dropout_rate: 0.05
-    causal: false
-  norm:
-    _target_: text_recognizer.networks.transformer.norm.RMSNorm
-    normalized_shape: 192
-  ff:
-    _target_: text_recognizer.networks.transformer.mlp.FeedForward
-    dim_out: null
-    expansion_factor: 4
-    glu: true
-    dropout_rate: 0.2
```