diff options
Diffstat (limited to 'training')
-rw-r--r-- | training/conf/experiment/conv_transformer_paragraphs.yaml | 7 |
1 file changed, 3 insertions, 4 deletions
diff --git a/training/conf/experiment/conv_transformer_paragraphs.yaml b/training/conf/experiment/conv_transformer_paragraphs.yaml
index e958367..00ad389 100644
--- a/training/conf/experiment/conv_transformer_paragraphs.yaml
+++ b/training/conf/experiment/conv_transformer_paragraphs.yaml
@@ -2,7 +2,7 @@
 defaults:
 - override /mapping: null
- - override /criterion: null
+ - override /criterion: cross_entropy
 - override /callbacks: htr
 - override /datamodule: iam_extended_paragraphs
 - override /network: null
@@ -18,7 +18,6 @@ max_output_len: &max_output_len 682
 summary: [[1, 1, 576, 640], [1, 682]]
 criterion:
- _target_: torch.nn.CrossEntropyLoss
 ignore_index: *ignore_index
 mapping: &mapping
@@ -50,7 +49,7 @@ lr_schedulers:
 max_lr: 1.0e-4
 total_steps: null
 epochs: *epochs
- steps_per_epoch: 722
+ steps_per_epoch: 1264
 pct_start: 0.01
 anneal_strategy: cos
 cycle_momentum: true
@@ -156,5 +155,5 @@ trainer:
 limit_val_batches: 1.0
 limit_test_batches: 1.0
 resume_from_checkpoint: null
- accumulate_grad_batches: 7
+ accumulate_grad_batches: 4
 overfit_batches: 0