summary | refs | log | tree | commit | diff
path: root/Makefile
diff options
context:
space:
mode:
author: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-09-30 23:57:49 +0200
committer: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-09-30 23:57:49 +0200
commit: 11ce8d3de5894f5055de41921483f3ed8af65a0e (patch)
tree: 6197ed66ef67ef2844e968835494db74076002ff /Makefile
parent: 5c2a4ea8aa6b2da1a6fe6f29a59a8ba20abcc38f (diff)
Add Makefile for downloading and generating datasets
Diffstat (limited to 'Makefile')
-rw-r--r-- Makefile 16
1 files changed, 16 insertions, 0 deletions
diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..2fb2148
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,16 @@
+.POSIX:
+
+download:
+	poetry run download-emnist
+	poetry run download-nltk
+	poetry run download-iam
+
+generate:
+	poetry run generate-emnist-lines
+	poetry run generate-iam-lines
+	poetry run generate-iam-paragraphs
+	poetry run generate-iam-synthetic-paragraphs
+	poetry run extract-iam-text --use_words --save_text train.txt --save_tokens letters.txt
+	poetry run make-wordpieces --output_prefix iamdb_1kwp --text_file train.txt --num_pieces 1000
+
+.PHONY: download generate