Update paragraph experiment

author: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2022-06-20 00:57:18 +0200
committer: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2022-06-20 00:57:18 +0200
commit: b76e27e895405dbaaf50c828817a71c9ec939de0 (patch)
tree: 441ad54f4689ee5c02d291e7b4f01edf9c0fa7c1 /training/conf
parent: 598fd271942884f852e98c82d6caedad425813a1 (diff)
1 file changed, 5 insertions, 5 deletions
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml
index af27a9e..d3311fd 100644
--- a/training/conf/experiment/conv_transformer_paragraphs.yaml
+++ b/training/conf/experiment/conv_transformer_paragraphs.yaml
@@ -40,7 +40,7 @@ lr_scheduler:
   max_lr: 3.0e-4
   total_steps: null
   epochs: *epochs
-  steps_per_epoch: 5037
+  steps_per_epoch: 3358
   pct_start: 0.15
   anneal_strategy: cos
   cycle_momentum: true
@@ -55,7 +55,7 @@ lr_scheduler:
   monitor: val/cer
 
 datamodule:
-  batch_size: 4
+  batch_size: 6
   train_fraction: 0.95
 
 network:
@@ -63,9 +63,9 @@ network:
   num_classes: *num_classes
   pad_index: *ignore_index
   encoder:
-    depth: 5
+    depth: 6
   decoder:
-    depth: 4
+    depth: 5
   pixel_embedding:
     shape: [18, 80]
 
@@ -75,4 +75,4 @@ model:
 trainer:
   gradient_clip_val: 0.5
   max_epochs: *epochs
-  accumulate_grad_batches: 2
+  accumulate_grad_batches: 1
author	Gustaf Rydholm <gustaf.rydholm@gmail.com>	2022-06-20 00:57:18 +0200
committer	Gustaf Rydholm <gustaf.rydholm@gmail.com>	2022-06-20 00:57:18 +0200
commit	b76e27e895405dbaaf50c828817a71c9ec939de0 (patch)
tree	441ad54f4689ee5c02d291e7b4f01edf9c0fa7c1 /training/conf
parent	598fd271942884f852e98c82d6caedad425813a1 (diff)