diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2021-11-05 19:28:01 +0100 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2021-11-05 19:28:01 +0100 |
commit | 632309bda9d27264992e5a9002290fae5f45e7ef (patch) | |
tree | b4ccb7ccfc64a25b7eed8a8444d4fa89d2ac5d97 /training | |
parent | 70540bf897df1d60375ea220cfab838cbd28c47f (diff) |
Update paragraphs config
Diffstat (limited to 'training')
-rw-r--r-- | training/conf/experiment/conv_transformer_paragraphs.yaml | 7 |
1 file changed, 3 insertions, 4 deletions
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml index e958367..00ad389 100644 --- a/training/conf/experiment/conv_transformer_paragraphs.yaml +++ b/training/conf/experiment/conv_transformer_paragraphs.yaml @@ -2,7 +2,7 @@ defaults: - override /mapping: null - - override /criterion: null + - override /criterion: cross_entropy - override /callbacks: htr - override /datamodule: iam_extended_paragraphs - override /network: null @@ -18,7 +18,6 @@ max_output_len: &max_output_len 682 summary: [[1, 1, 576, 640], [1, 682]] criterion: - _target_: torch.nn.CrossEntropyLoss ignore_index: *ignore_index mapping: &mapping @@ -50,7 +49,7 @@ lr_schedulers: max_lr: 1.0e-4 total_steps: null epochs: *epochs - steps_per_epoch: 722 + steps_per_epoch: 1264 pct_start: 0.01 anneal_strategy: cos cycle_momentum: true @@ -156,5 +155,5 @@ trainer: limit_val_batches: 1.0 limit_test_batches: 1.0 resume_from_checkpoint: null - accumulate_grad_batches: 7 + accumulate_grad_batches: 4 overfit_batches: 0 |