diff options
Diffstat (limited to 'training')
-rw-r--r-- | training/conf/experiment/cnn_transformer_paragraphs.yaml | 2 |
-rw-r--r-- | training/conf/experiment/cnn_transformer_paragraphs_wp.yaml | 2 |
2 files changed, 2 insertions, 2 deletions
diff --git a/training/conf/experiment/cnn_transformer_paragraphs.yaml b/training/conf/experiment/cnn_transformer_paragraphs.yaml
index e9cd254..8feb1bc 100644
--- a/training/conf/experiment/cnn_transformer_paragraphs.yaml
+++ b/training/conf/experiment/cnn_transformer_paragraphs.yaml
@@ -49,7 +49,7 @@ lr_schedulers:
 max_lr: 2.0e-4
 total_steps: null
 epochs: *epochs
-steps_per_epoch: 79
+steps_per_epoch: 632
 pct_start: 0.3
 anneal_strategy: cos
 cycle_momentum: true
diff --git a/training/conf/experiment/cnn_transformer_paragraphs_wp.yaml b/training/conf/experiment/cnn_transformer_paragraphs_wp.yaml
index 6d2bbdb..1c9bba1 100644
--- a/training/conf/experiment/cnn_transformer_paragraphs_wp.yaml
+++ b/training/conf/experiment/cnn_transformer_paragraphs_wp.yaml
@@ -56,7 +56,7 @@ lr_schedulers:
 max_lr: 3.0e-4
 total_steps: null
 epochs: *epochs
-steps_per_epoch: 79
+steps_per_epoch: 632
 pct_start: 0.3
 anneal_strategy: cos
 cycle_momentum: true