summary | refs | log | tree | commit | diff
path: root/training/conf/experiment/barlow_twins.yaml
diff options
context:
space:
mode:
Diffstat (limited to 'training/conf/experiment/barlow_twins.yaml')
-rw-r--r-- training/conf/experiment/barlow_twins.yaml | 12
1 files changed, 5 insertions, 7 deletions
diff --git a/training/conf/experiment/barlow_twins.yaml b/training/conf/experiment/barlow_twins.yaml
index e3586bf..cc1295d 100644
--- a/training/conf/experiment/barlow_twins.yaml
+++ b/training/conf/experiment/barlow_twins.yaml
@@ -8,14 +8,12 @@ defaults:
- override /lr_schedulers: null
- override /optimizers: null
-
-print_config: true
epochs: &epochs 1000
summary: [[1, 1, 56, 1024]]
criterion:
_target_: text_recognizer.criterions.barlow_twins.BarlowTwinsLoss
- dim: 2048
+ dim: 512
lambda_: 3.9e-3
callbacks:
@@ -30,7 +28,7 @@ callbacks:
optimizers:
madgrad:
_target_: madgrad.MADGRAD
- lr: 3.0e-4
+ lr: 1.0e-3
momentum: 0.9
weight_decay: 1.0e-6
eps: 1.0e-6
@@ -61,7 +59,7 @@ datamodule:
_target_: text_recognizer.data.iam_lines.IAMLines
batch_size: 16
num_workers: 12
- train_fraction: 0.8
+ train_fraction: 0.9
pin_memory: false
transform: transform/iam_lines_barlow.yaml
test_transform: transform/iam_lines_barlow.yaml
@@ -79,7 +77,7 @@ network:
bn_eps: 1.0e-3
projector:
_target_: text_recognizer.networks.barlow_twins.projector.Projector
- dims: [1280, 2048, 2048]
+ dims: [1280, 512, 512, 512]
model:
_target_: text_recognizer.models.barlow_twins.BarlowTwinsLitModel
@@ -100,5 +98,5 @@ trainer:
limit_val_batches: 1.0
limit_test_batches: 1.0
resume_from_checkpoint: null
- accumulate_grad_batches: 64
+ accumulate_grad_batches: 32
overfit_batches: 0