summary | refs | log | tree | commit | diff
path: root/training/conf/model
diff options
context:
space:
mode:
author Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-07-30 23:15:03 +0200
committer Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-07-30 23:15:03 +0200
commit 7268035fb9e57342612a8cc50a1fe04e8841ca2f (patch)
tree 8d4cf3743975bd25f2c04d6a56ff3d4608a7e8d9 /training/conf/model
parent 92fc1c7ed2f9f64552be8f71d9b8ab0d5a0a88d4 (diff)
attr bug fix, properly loading network
Diffstat (limited to 'training/conf/model')
-rw-r--r-- training/conf/model/lit_transformer.yaml 8
-rw-r--r-- training/conf/model/mapping/word_piece.yaml 9
2 files changed, 16 insertions, 1 deletions
diff --git a/training/conf/model/lit_transformer.yaml b/training/conf/model/lit_transformer.yaml
index 4e04b85..5341d8e 100644
--- a/training/conf/model/lit_transformer.yaml
+++ b/training/conf/model/lit_transformer.yaml
@@ -1,4 +1,10 @@
+defaults:
+ - mapping: word_piece
+
_target_: text_recognizer.models.transformer.TransformerLitModel
interval: null
monitor: val/loss
-ignore_tokens: ["<s>", "<e>", "<p>"]
+ignore_tokens: [ <s>, <e>, <p> ]
+start_token: <s>
+end_token: <e>
+pad_token: <p>
diff --git a/training/conf/model/mapping/word_piece.yaml b/training/conf/model/mapping/word_piece.yaml
new file mode 100644
index 0000000..39e2ba4
--- /dev/null
+++ b/training/conf/model/mapping/word_piece.yaml
@@ -0,0 +1,9 @@
+_target_: text_recognizer.data.mappings.WordPieceMapping
+num_features: 1000
+tokens: iamdb_1kwp_tokens_1000.txt
+lexicon: iamdb_1kwp_lex_1000.txt
+data_dir: null
+use_words: false
+prepend_wordsep: false
+special_tokens: ["<s>", "<e>", "<p>"]
+extra_symbols: ["\n"]