summary | refs | log | tree | commit | diff
path: root/training/conf
diff options
context:
space:
mode:
author Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-10-24 00:58:36 +0200
committer Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-10-24 00:58:36 +0200
commit bdc85d2417a12e2978957156076eaaeff7e28999 (patch)
tree 05a52550599fbc3efa7ad1df597fb55ff4c83689 /training/conf
parent 914e5958d168355195f2eec0169da687395bde2a (diff)
Update configs
Diffstat (limited to 'training/conf')
-rw-r--r-- training/conf/experiment/barlow_twins.yaml 8
-rw-r--r-- training/conf/experiment/cnn_htr_char_lines.yaml 5
2 files changed, 6 insertions, 7 deletions
diff --git a/training/conf/experiment/barlow_twins.yaml b/training/conf/experiment/barlow_twins.yaml
index cb5035b..e3586bf 100644
--- a/training/conf/experiment/barlow_twins.yaml
+++ b/training/conf/experiment/barlow_twins.yaml
@@ -15,8 +15,8 @@ summary: [[1, 1, 56, 1024]]
criterion:
_target_: text_recognizer.criterions.barlow_twins.BarlowTwinsLoss
- dim: 512
- lambda_: 5.1e-3
+ dim: 2048
+ lambda_: 3.9e-3
callbacks:
stochastic_weight_averaging:
@@ -79,7 +79,7 @@ network:
bn_eps: 1.0e-3
projector:
_target_: text_recognizer.networks.barlow_twins.projector.Projector
- dims: [1280, 512, 512, 512]
+ dims: [1280, 2048, 2048]
model:
_target_: text_recognizer.models.barlow_twins.BarlowTwinsLitModel
@@ -100,5 +100,5 @@ trainer:
limit_val_batches: 1.0
limit_test_batches: 1.0
resume_from_checkpoint: null
- accumulate_grad_batches: 16
+ accumulate_grad_batches: 64
overfit_batches: 0
diff --git a/training/conf/experiment/cnn_htr_char_lines.yaml b/training/conf/experiment/cnn_htr_char_lines.yaml
index 53f6d91..682f138 100644
--- a/training/conf/experiment/cnn_htr_char_lines.yaml
+++ b/training/conf/experiment/cnn_htr_char_lines.yaml
@@ -18,8 +18,8 @@ criterion:
smoothing: 0.1
ignore_index: *ignore_index
-mapping:
- mapping: &mapping
+mapping: &mapping
+ mapping:
_target_: text_recognizer.data.emnist_mapping.EmnistMapping
callbacks:
@@ -38,7 +38,6 @@ optimizers:
momentum: 0.9
weight_decay: 0
eps: 1.0e-6
-
parameters: network
lr_schedulers: