Update configs: switch LR scheduler to ReduceLROnPlateau and retune training settings

author: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2022-06-22 22:27:17 +0200
committer: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2022-06-22 22:27:17 +0200
commit: a30acba378f6f8fb86bb1a6096b9eb0ae7a68449 (patch)
tree: c4a1087520a05a1f0bc792887b1ab51694a59b84 /training/conf/experiment
parent: 1d592a432e57eadff0b94f945e59cbeb95e6a3f0 (diff)
1 file changed, 15 insertions, 20 deletions
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml
index 80f6ce6..41c236d 100644
--- a/training/conf/experiment/conv_transformer_paragraphs.yaml
+++ b/training/conf/experiment/conv_transformer_paragraphs.yaml
@@ -41,26 +41,21 @@ optimizer:
   eps: 1.0e-8
 
 lr_scheduler:
-  _target_: torch.optim.lr_scheduler.OneCycleLR
-  max_lr: 3.0e-4
-  total_steps: null
-  epochs: *epochs
-  steps_per_epoch: 3358
-  pct_start: 0.1
-  anneal_strategy: cos
-  cycle_momentum: true
-  base_momentum: 0.85
-  max_momentum: 0.95
-  div_factor: 25.0
-  final_div_factor: 10000.0
-  three_phase: true
-  last_epoch: -1
+  _target_: torch.optim.lr_scheduler.ReduceLROnPlateau
+  mode: min
+  factor: 0.8
+  patience: 10
+  threshold: 1.0e-4
+  threshold_mode: rel
+  cooldown: 0
+  min_lr: 1.0e-5
+  eps: 1.0e-8
   verbose: false
-  interval: step
+  interval: epoch
   monitor: val/cer
 
 datamodule:
-  batch_size: 6
+  batch_size: 8
   train_fraction: 0.95
 
 network:
@@ -68,16 +63,16 @@ network:
   num_classes: *num_classes
   pad_index: *ignore_index
   encoder:
-    depth: 6
-  decoder:
     depth: 4
+  decoder:
+    depth: 6
   pixel_embedding:
-    shape: [18, 80]
+    shape: [18, 79]
 
 model:
   max_output_len: *max_output_len
 
 trainer:
-  gradient_clip_val: 0.5
+  gradient_clip_val: 1.0
   max_epochs: *epochs
   accumulate_grad_batches: 1
author	Gustaf Rydholm <gustaf.rydholm@gmail.com>	2022-06-22 22:27:17 +0200
committer	Gustaf Rydholm <gustaf.rydholm@gmail.com>	2022-06-22 22:27:17 +0200
commit	a30acba378f6f8fb86bb1a6096b9eb0ae7a68449 (patch)
tree	c4a1087520a05a1f0bc792887b1ab51694a59b84 /training/conf/experiment
parent	1d592a432e57eadff0b94f945e59cbeb95e6a3f0 (diff)