summary | refs | log | tree | commit | diff
path: root/training/conf/datamodule
diff options
context:
space:
mode:
Diffstat (limited to 'training/conf/datamodule')
-rw-r--r-- training/conf/datamodule/target_transform/word_piece.yaml | 3
-rw-r--r-- training/conf/datamodule/target_transform/word_piece_iam.yaml | 3
-rw-r--r-- training/conf/datamodule/target_transform/word_pieces.yaml | 3
-rw-r--r-- training/conf/datamodule/transform/barlow_paragraphs.yaml | 46
4 files changed, 52 insertions, 3 deletions
diff --git a/training/conf/datamodule/target_transform/word_piece.yaml b/training/conf/datamodule/target_transform/word_piece.yaml
new file mode 100644
index 0000000..bf284fb
--- /dev/null
+++ b/training/conf/datamodule/target_transform/word_piece.yaml
@@ -0,0 +1,3 @@
+word_piece:
+  _target_: text_recognizer.data.transforms.word_piece.WordPiece
+  max_len: 451
diff --git a/training/conf/datamodule/target_transform/word_piece_iam.yaml b/training/conf/datamodule/target_transform/word_piece_iam.yaml
new file mode 100644
index 0000000..478987c
--- /dev/null
+++ b/training/conf/datamodule/target_transform/word_piece_iam.yaml
@@ -0,0 +1,3 @@
+word_piece:
+  _target_: text_recognizer.data.transforms.word_piece.WordPiece
+  max_len: 72
diff --git a/training/conf/datamodule/target_transform/word_pieces.yaml b/training/conf/datamodule/target_transform/word_pieces.yaml
deleted file mode 100644
index 8ace2af..0000000
--- a/training/conf/datamodule/target_transform/word_pieces.yaml
+++ /dev/null
@@ -1,3 +0,0 @@
-word_pieces:
-  _target_: text_recognizer.data.transforms.word_pieces.WordPieces
-  max_len: 451
diff --git a/training/conf/datamodule/transform/barlow_paragraphs.yaml b/training/conf/datamodule/transform/barlow_paragraphs.yaml
new file mode 100644
index 0000000..5eefce5
--- /dev/null
+++ b/training/conf/datamodule/transform/barlow_paragraphs.yaml
@@ -0,0 +1,46 @@
+
+barlow:
+  _target_: text_recognizer.data.transforms.barlow.BarlowTransform
+  prim:
+    random_crop:
+      _target_: torchvision.transforms.RandomCrop
+      size: [576, 640]
+      padding: null
+      pad_if_needed: true
+      fill: 0
+      padding_mode: constant
+
+    color_jitter:
+      _target_: torchvision.transforms.ColorJitter
+      brightness: [0.8, 1.6]
+
+    random_affine:
+      _target_: torchvision.transforms.RandomAffine
+      degrees: 1
+      shear: [-10, 10]
+      interpolation: BILINEAR
+
+    to_tensor:
+      _target_: torchvision.transforms.ToTensor
+
+  bis:
+    random_crop:
+      _target_: torchvision.transforms.RandomCrop
+      size: [576, 640]
+      padding: null
+      pad_if_needed: true
+      fill: 0
+      padding_mode: constant
+
+    color_jitter:
+      _target_: torchvision.transforms.ColorJitter
+      brightness: [0.8, 2.0]
+
+    random_affine:
+      _target_: torchvision.transforms.RandomAffine
+      degrees: 1
+      shear: [-5, 5]
+      interpolation: BILINEAR
+
+    to_tensor:
+      _target_: torchvision.transforms.ToTensor