diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-06-20 00:57:18 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-06-20 00:57:18 +0200 |
commit | b76e27e895405dbaaf50c828817a71c9ec939de0 (patch) | |
tree | 441ad54f4689ee5c02d291e7b4f01edf9c0fa7c1 /training/conf | |
parent | 598fd271942884f852e98c82d6caedad425813a1 (diff) |
Update paragraph experiment
Diffstat (limited to 'training/conf')
-rw-r--r-- | training/conf/experiment/conv_transformer_paragraphs.yaml | 10 |
1 files changed, 5 insertions, 5 deletions
```diff
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml
index af27a9e..d3311fd 100644
--- a/training/conf/experiment/conv_transformer_paragraphs.yaml
+++ b/training/conf/experiment/conv_transformer_paragraphs.yaml
@@ -40,7 +40,7 @@ lr_scheduler:
   max_lr: 3.0e-4
   total_steps: null
   epochs: *epochs
-  steps_per_epoch: 5037
+  steps_per_epoch: 3358
   pct_start: 0.15
   anneal_strategy: cos
   cycle_momentum: true
@@ -55,7 +55,7 @@ lr_scheduler:
   monitor: val/cer
 
 datamodule:
-  batch_size: 4
+  batch_size: 6
   train_fraction: 0.95
 
 network:
@@ -63,9 +63,9 @@ network:
   num_classes: *num_classes
   pad_index: *ignore_index
   encoder:
-    depth: 5
+    depth: 6
   decoder:
-    depth: 4
+    depth: 5
   pixel_embedding:
     shape: [18, 80]
 
@@ -75,4 +75,4 @@ model:
 trainer:
   gradient_clip_val: 0.5
   max_epochs: *epochs
-  accumulate_grad_batches: 2
+  accumulate_grad_batches: 1
```