summaryrefslogtreecommitdiff
path: root/training/conf/network/conformer.yaml
diff options
context:
space:
mode:
Diffstat (limited to 'training/conf/network/conformer.yaml')
-rw-r--r--training/conf/network/conformer.yaml36
1 files changed, 36 insertions, 0 deletions
diff --git a/training/conf/network/conformer.yaml b/training/conf/network/conformer.yaml
new file mode 100644
index 0000000..1d72dd5
--- /dev/null
+++ b/training/conf/network/conformer.yaml
@@ -0,0 +1,36 @@
+_target_: text_recognizer.networks.conformer.Conformer
+depth: 8
+num_classes: 57
+dim: &dim 144
+dim_gru: 144
+block:
+ _target_: text_recognizer.networks.conformer.ConformerBlock
+ dim: *dim
+ attn:
+ _target_: text_recognizer.networks.conformer.Attention
+ dim: *dim
+ heads: 8
+ dim_head: 64
+ mult: 4
+ ff:
+ _target_: text_recognizer.networks.conformer.Feedforward
+ dim: *dim
+ expansion_factor: 4
+ dropout: 0.1
+ conv:
+ _target_: text_recognizer.networks.conformer.ConformerConv
+ dim: *dim
+ expansion_factor: 2
+ kernel_size: 31
+ dropout: 0.1
+subsampler:
+ _target_: text_recognizer.networks.conformer.Subsampler
+ pixel_pos_embedding:
+ _target_: text_recognizer.networks.transformer.AxialPositionalEmbedding
+ dim: 64
+ shape: [6, 127]
+ channels: 64
+ height: 6
+ dim: *dim
+ depth: 3
+ dropout: 0.1