diff options
Diffstat (limited to 'training')
| -rw-r--r-- | training/conf/experiment/conv_transformer_lines.yaml | 2 | ||||
| -rw-r--r-- | training/conf/experiment/conv_transformer_paragraphs.yaml | 11 | 
2 files changed, 11 insertions, 2 deletions
diff --git a/training/conf/experiment/conv_transformer_lines.yaml b/training/conf/experiment/conv_transformer_lines.yaml index fe9ef6e..6c266b8 100644 --- a/training/conf/experiment/conv_transformer_lines.yaml +++ b/training/conf/experiment/conv_transformer_lines.yaml @@ -113,7 +113,7 @@ network:      dim: *hidden_dim      heads: 4      shape: *shape -    depth: 2 +    depth: 1      dim_head: 64      dim_index: 1 diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml index d2916e1..4f15ef2 100644 --- a/training/conf/experiment/conv_transformer_paragraphs.yaml +++ b/training/conf/experiment/conv_transformer_paragraphs.yaml @@ -18,6 +18,7 @@ summary: [[1, 1, 576, 640], [1, 682]]  criterion:    ignore_index: *ignore_index +  label_smoothing: 0.1  mapping: &mapping    mapping: @@ -108,7 +109,15 @@ network:    pixel_pos_embedding:      _target_: text_recognizer.networks.transformer.embeddings.axial.AxialPositionalEmbedding      dim: *hidden_dim -    shape: [18, 20] +    shape: &shape [36, 40] +  axial_encoder: +    _target_: text_recognizer.networks.transformer.axial_attention.encoder.AxialEncoder +    dim: *hidden_dim +    heads: 4 +    shape: *shape +    depth: 1 +    dim_head: 64 +    dim_index: 1  model:    _target_: text_recognizer.models.transformer.TransformerLitModel  |