summaryrefslogtreecommitdiff
path: root/text_recognizer/tests/support
diff options
context:
space:
mode:
authorGustaf Rydholm <gustaf.rydholm@gmail.com>2021-03-21 22:33:58 +0100
committerGustaf Rydholm <gustaf.rydholm@gmail.com>2021-03-21 22:33:58 +0100
commite3741de333a3a43a7968241b6eccaaac66dd7b20 (patch)
tree7c50aee4ca61f77e95f1b038030292c64bbb86c2 /text_recognizer/tests/support
parentaac452a2dc008338cb543549652da293c14b6b4e (diff)
Working on EMNIST Lines dataset
Diffstat (limited to 'text_recognizer/tests/support')
-rw-r--r--text_recognizer/tests/support/__init__.py2
-rw-r--r--text_recognizer/tests/support/create_emnist_lines_support_files.py51
-rw-r--r--text_recognizer/tests/support/create_emnist_support_files.py30
-rw-r--r--text_recognizer/tests/support/create_iam_lines_support_files.py50
-rw-r--r--text_recognizer/tests/support/emnist_lines/Knox Ky<eos>.pngbin2301 -> 0 bytes
-rw-r--r--text_recognizer/tests/support/emnist_lines/ancillary beliefs and<eos>.pngbin5424 -> 0 bytes
-rw-r--r--text_recognizer/tests/support/emnist_lines/they<eos>.pngbin1391 -> 0 bytes
-rw-r--r--text_recognizer/tests/support/iam_lines/He rose from his breakfast-nook bench<eos>.pngbin5170 -> 0 bytes
-rw-r--r--text_recognizer/tests/support/iam_lines/and came into the livingroom, where<eos>.pngbin3617 -> 0 bytes
-rw-r--r--text_recognizer/tests/support/iam_lines/his entrance. He came, almost falling<eos>.pngbin3923 -> 0 bytes
-rw-r--r--text_recognizer/tests/support/iam_paragraphs/a01-000u.jpgbin14890 -> 0 bytes
11 files changed, 0 insertions, 133 deletions
diff --git a/text_recognizer/tests/support/__init__.py b/text_recognizer/tests/support/__init__.py
deleted file mode 100644
index a265ede..0000000
--- a/text_recognizer/tests/support/__init__.py
+++ /dev/null
@@ -1,2 +0,0 @@
-"""Support file modules."""
-from .create_emnist_support_files import create_emnist_support_files
diff --git a/text_recognizer/tests/support/create_emnist_lines_support_files.py b/text_recognizer/tests/support/create_emnist_lines_support_files.py
deleted file mode 100644
index 9abe143..0000000
--- a/text_recognizer/tests/support/create_emnist_lines_support_files.py
+++ /dev/null
@@ -1,51 +0,0 @@
-"""Module for creating EMNIST Lines test support files."""
-# flake8: noqa: S106
-
-from pathlib import Path
-import shutil
-
-import numpy as np
-
-from text_recognizer.datasets import EmnistLinesDataset
-import text_recognizer.util as util
-
-
-SUPPORT_DIRNAME = Path(__file__).parents[0].resolve() / "emnist_lines"
-
-
-def create_emnist_lines_support_files() -> None:
- """Create EMNIST Lines test images."""
- shutil.rmtree(SUPPORT_DIRNAME, ignore_errors=True)
- SUPPORT_DIRNAME.mkdir()
-
- # TODO: maybe have to add args to dataset.
- dataset = EmnistLinesDataset(
- init_token="<sos>",
- pad_token="_",
- eos_token="<eos>",
- transform=[{"type": "ToTensor", "args": {}}],
- target_transform=[
- {
- "type": "AddTokens",
- "args": {"init_token": "<sos>", "pad_token": "_", "eos_token": "<eos>"},
- }
- ],
- ) # nosec: S106
- dataset.load_or_generate_data()
-
- for index in [5, 7, 9]:
- image, target = dataset[index]
- if len(image.shape) == 3:
- image = image.squeeze(0)
- print(image.sum(), image.dtype)
-
- label = "".join(dataset.mapper(label) for label in target[1:]).strip(
- dataset.mapper.pad_token
- )
- print(label)
- image = image.numpy()
- util.write_image(image, str(SUPPORT_DIRNAME / f"{label}.png"))
-
-
-if __name__ == "__main__":
- create_emnist_lines_support_files()
diff --git a/text_recognizer/tests/support/create_emnist_support_files.py b/text_recognizer/tests/support/create_emnist_support_files.py
deleted file mode 100644
index f9ff030..0000000
--- a/text_recognizer/tests/support/create_emnist_support_files.py
+++ /dev/null
@@ -1,30 +0,0 @@
-"""Module for creating EMNIST test support files."""
-from pathlib import Path
-import shutil
-
-from text_recognizer.datasets import EmnistDataset
-from text_recognizer.util import write_image
-
-SUPPORT_DIRNAME = Path(__file__).parents[0].resolve() / "emnist"
-
-
-def create_emnist_support_files() -> None:
- """Create support images for test of CharacterPredictor class."""
- shutil.rmtree(SUPPORT_DIRNAME, ignore_errors=True)
- SUPPORT_DIRNAME.mkdir()
-
- dataset = EmnistDataset(train=False)
- dataset.load_or_generate_data()
-
- for index in [5, 7, 9]:
- image, label = dataset[index]
- if len(image.shape) == 3:
- image = image.squeeze(0)
- image = image.numpy()
- label = dataset.mapper(int(label))
- print(index, label)
- write_image(image, str(SUPPORT_DIRNAME / f"{label}.png"))
-
-
-if __name__ == "__main__":
- create_emnist_support_files()
diff --git a/text_recognizer/tests/support/create_iam_lines_support_files.py b/text_recognizer/tests/support/create_iam_lines_support_files.py
deleted file mode 100644
index 50f9e3d..0000000
--- a/text_recognizer/tests/support/create_iam_lines_support_files.py
+++ /dev/null
@@ -1,50 +0,0 @@
-"""Module for creating IAM Lines test support files."""
-# flake8: noqa
-from pathlib import Path
-import shutil
-
-import numpy as np
-
-from text_recognizer.datasets import IamLinesDataset
-import text_recognizer.util as util
-
-
-SUPPORT_DIRNAME = Path(__file__).parents[0].resolve() / "iam_lines"
-
-
-def create_emnist_lines_support_files() -> None:
- """Create IAM Lines test images."""
- shutil.rmtree(SUPPORT_DIRNAME, ignore_errors=True)
- SUPPORT_DIRNAME.mkdir()
-
- # TODO: maybe have to add args to dataset.
- dataset = IamLinesDataset(
- init_token="<sos>",
- pad_token="_",
- eos_token="<eos>",
- transform=[{"type": "ToTensor", "args": {}}],
- target_transform=[
- {
- "type": "AddTokens",
- "args": {"init_token": "<sos>", "pad_token": "_", "eos_token": "<eos>"},
- }
- ],
- )
- dataset.load_or_generate_data()
-
- for index in [0, 1, 3]:
- image, target = dataset[index]
- if len(image.shape) == 3:
- image = image.squeeze(0)
- print(image.sum(), image.dtype)
-
- label = "".join(dataset.mapper(label) for label in target[1:]).strip(
- dataset.mapper.pad_token
- )
- print(label)
- image = image.numpy()
- util.write_image(image, str(SUPPORT_DIRNAME / f"{label}.png"))
-
-
-if __name__ == "__main__":
- create_emnist_lines_support_files()
diff --git a/text_recognizer/tests/support/emnist_lines/Knox Ky<eos>.png b/text_recognizer/tests/support/emnist_lines/Knox Ky<eos>.png
deleted file mode 100644
index b7d0618..0000000
--- a/text_recognizer/tests/support/emnist_lines/Knox Ky<eos>.png
+++ /dev/null
Binary files differ
diff --git a/text_recognizer/tests/support/emnist_lines/ancillary beliefs and<eos>.png b/text_recognizer/tests/support/emnist_lines/ancillary beliefs and<eos>.png
deleted file mode 100644
index 14a8cf3..0000000
--- a/text_recognizer/tests/support/emnist_lines/ancillary beliefs and<eos>.png
+++ /dev/null
Binary files differ
diff --git a/text_recognizer/tests/support/emnist_lines/they<eos>.png b/text_recognizer/tests/support/emnist_lines/they<eos>.png
deleted file mode 100644
index 7f05951..0000000
--- a/text_recognizer/tests/support/emnist_lines/they<eos>.png
+++ /dev/null
Binary files differ
diff --git a/text_recognizer/tests/support/iam_lines/He rose from his breakfast-nook bench<eos>.png b/text_recognizer/tests/support/iam_lines/He rose from his breakfast-nook bench<eos>.png
deleted file mode 100644
index 6eeb642..0000000
--- a/text_recognizer/tests/support/iam_lines/He rose from his breakfast-nook bench<eos>.png
+++ /dev/null
Binary files differ
diff --git a/text_recognizer/tests/support/iam_lines/and came into the livingroom, where<eos>.png b/text_recognizer/tests/support/iam_lines/and came into the livingroom, where<eos>.png
deleted file mode 100644
index 4974cf8..0000000
--- a/text_recognizer/tests/support/iam_lines/and came into the livingroom, where<eos>.png
+++ /dev/null
Binary files differ
diff --git a/text_recognizer/tests/support/iam_lines/his entrance. He came, almost falling<eos>.png b/text_recognizer/tests/support/iam_lines/his entrance. He came, almost falling<eos>.png
deleted file mode 100644
index a731245..0000000
--- a/text_recognizer/tests/support/iam_lines/his entrance. He came, almost falling<eos>.png
+++ /dev/null
Binary files differ
diff --git a/text_recognizer/tests/support/iam_paragraphs/a01-000u.jpg b/text_recognizer/tests/support/iam_paragraphs/a01-000u.jpg
deleted file mode 100644
index d9753b6..0000000
--- a/text_recognizer/tests/support/iam_paragraphs/a01-000u.jpg
+++ /dev/null
Binary files differ