diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2021-10-27 22:43:17 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2021-10-27 22:43:17 +0200 |
commit | 80dcd02c52b11e944967e5e80a6562c4a8b3ed2e (patch) | |
tree | f03bf84db1f2bb641c76b32c37f1437fd2d997b0 /training | |
parent | 31209cc745e2602345eaf5ab6736acb3c9f1be56 (diff) |
Update conv transformer experiment config
Diffstat (limited to 'training')
-rw-r--r-- | training/conf/experiment/conv_transformer_paragraphs.yaml | 6 |
1 files changed, 3 insertions, 3 deletions
```diff
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml
index 4de9722..8c3af44 100644
--- a/training/conf/experiment/conv_transformer_paragraphs.yaml
+++ b/training/conf/experiment/conv_transformer_paragraphs.yaml
@@ -50,7 +50,7 @@ lr_schedulers:
     max_lr: 1.0e-4
     total_steps: null
     epochs: *epochs
-    steps_per_epoch: 316
+    steps_per_epoch: 211
     pct_start: 0.03
     anneal_strategy: cos
     cycle_momentum: true
@@ -66,7 +66,7 @@ lr_schedulers:
 
 datamodule:
   _target_: text_recognizer.data.iam_extended_paragraphs.IAMExtendedParagraphs
-  batch_size: 4
+  batch_size: 6
   num_workers: 12
   train_fraction: 0.8
   pin_memory: true
@@ -75,7 +75,7 @@ datamodule:
 network:
   _target_: text_recognizer.networks.conv_transformer.ConvTransformer
   input_dims: [1, 576, 640]
-  hidden_dim: &hidden_dim 256
+  hidden_dim: &hidden_dim 192
   encoder_dim: 1280
   dropout_rate: 0.1
   num_classes: *num_classes
```