summary | refs | log | tree | commit | diff
path: root/training/conf/experiment/conv_transformer_paragraphs.yaml
diff options
context:
space:
mode:
author Gustaf Rydholm <gustaf.rydholm@gmail.com> 2022-06-20 00:57:18 +0200
committer Gustaf Rydholm <gustaf.rydholm@gmail.com> 2022-06-20 00:57:18 +0200
commit b76e27e895405dbaaf50c828817a71c9ec939de0 (patch)
tree 441ad54f4689ee5c02d291e7b4f01edf9c0fa7c1 /training/conf/experiment/conv_transformer_paragraphs.yaml
parent 598fd271942884f852e98c82d6caedad425813a1 (diff)
Update paragraph experiment
Diffstat (limited to 'training/conf/experiment/conv_transformer_paragraphs.yaml')
-rw-r--r-- training/conf/experiment/conv_transformer_paragraphs.yaml 10
1 file changed, 5 insertions, 5 deletions
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml
index af27a9e..d3311fd 100644
--- a/training/conf/experiment/conv_transformer_paragraphs.yaml
+++ b/training/conf/experiment/conv_transformer_paragraphs.yaml
@@ -40,7 +40,7 @@ lr_scheduler:
max_lr: 3.0e-4
total_steps: null
epochs: *epochs
- steps_per_epoch: 5037
+ steps_per_epoch: 3358
pct_start: 0.15
anneal_strategy: cos
cycle_momentum: true
@@ -55,7 +55,7 @@ lr_scheduler:
monitor: val/cer
datamodule:
- batch_size: 4
+ batch_size: 6
train_fraction: 0.95
network:
@@ -63,9 +63,9 @@ network:
num_classes: *num_classes
pad_index: *ignore_index
encoder:
- depth: 5
+ depth: 6
decoder:
- depth: 4
+ depth: 5
pixel_embedding:
shape: [18, 80]
@@ -75,4 +75,4 @@ model:
trainer:
gradient_clip_val: 0.5
max_epochs: *epochs
- accumulate_grad_batches: 2
+ accumulate_grad_batches: 1