From 34098ccbbbf6379c0bd29a987440b8479c743746 Mon Sep 17 00:00:00 2001 From: Gustaf Rydholm Date: Thu, 29 Jul 2021 23:59:52 +0200 Subject: Configs, refactor with attrs, fix attr bug in iam --- training/conf/criterion/label_smoothing.yaml | 4 ++++ training/conf/mapping/word_piece.yaml | 9 +++++++++ training/conf/model/lit_transformer.yaml | 4 ++++ training/conf/network/conv_transformer.yaml | 13 +++++++++++++ 4 files changed, 30 insertions(+) create mode 100644 training/conf/mapping/word_piece.yaml create mode 100644 training/conf/model/lit_transformer.yaml create mode 100644 training/conf/network/conv_transformer.yaml (limited to 'training') diff --git a/training/conf/criterion/label_smoothing.yaml b/training/conf/criterion/label_smoothing.yaml index e69de29..ee47c59 100644 --- a/training/conf/criterion/label_smoothing.yaml +++ b/training/conf/criterion/label_smoothing.yaml @@ -0,0 +1,4 @@ +_target_: text_recognizer.criterion.label_smoothing +label_smoothing: 0.1 +vocab_size: 1006 +ignore_index: 1002 diff --git a/training/conf/mapping/word_piece.yaml b/training/conf/mapping/word_piece.yaml new file mode 100644 index 0000000..39e2ba4 --- /dev/null +++ b/training/conf/mapping/word_piece.yaml @@ -0,0 +1,9 @@ +_target_: text_recognizer.data.mappings.WordPieceMapping +num_features: 1000 +tokens: iamdb_1kwp_tokens_1000.txt +lexicon: iamdb_1kwp_lex_1000.txt +data_dir: null +use_words: false +prepend_wordsep: false +special_tokens: ["<s>", "<e>", "<p>"] +extra_symbols: ["\n"] diff --git a/training/conf/model/lit_transformer.yaml b/training/conf/model/lit_transformer.yaml new file mode 100644 index 0000000..4e04b85 --- /dev/null +++ b/training/conf/model/lit_transformer.yaml @@ -0,0 +1,4 @@ +_target_: text_recognizer.models.transformer.TransformerLitModel +interval: null +monitor: val/loss +ignore_tokens: ["<s>", "<e>", "<p>"] diff --git a/training/conf/network/conv_transformer.yaml b/training/conf/network/conv_transformer.yaml new file mode 100644 index 0000000..f72e030 --- /dev/null +++ b/training/conf/network/conv_transformer.yaml @@ -0,0 +1,13 @@ +defaults: + - encoder: efficientnet + - decoder: transformer_decoder + +_target_: text_recognizer.networks.conv_transformer.ConvTransformer +input_dims: [1, 576, 640] +hidden_dim: 256 +dropout_rate: 0.2 +max_output_len: 682 +num_classes: 1004 +start_token: <s> +end_token: <e> +pad_token: <p>

-- cgit v1.2.3-70-g09d2