summary refs log tree commit diff
path: root/src/tasks/make_wordpieces.py
diff options
context:
space:
mode:
Diffstat (limited to 'src/tasks/make_wordpieces.py')
-rw-r--r-- src/tasks/make_wordpieces.py 2
1 files changed, 1 insertions, 1 deletions
diff --git a/src/tasks/make_wordpieces.py b/src/tasks/make_wordpieces.py
index f605920..2ac0e2c 100644
--- a/src/tasks/make_wordpieces.py
+++ b/src/tasks/make_wordpieces.py
@@ -30,7 +30,7 @@ def iamdb_pieces(
user_symbols=["/"], # added so token is in the output set
)
- vocab = sorted(set(w for t in text for w in t.split("_") if w))
+ vocab = sorted(set(w for t in text for w in t.split("▁") if w))
if "move" not in vocab:
raise RuntimeError("`MOVE` not in vocab")