From c9c60678673e19ad3367339eb8e7a093e5a98474 Mon Sep 17 00:00:00 2001
From: Gustaf Rydholm
Date: Sun, 9 May 2021 22:46:09 +0200
Subject: Reformatting of positional encodings and ViT working

---
 text_recognizer/networks/vision_transformer.py | 7 +++++++
 1 file changed, 7 insertions(+)
 create mode 100644 text_recognizer/networks/vision_transformer.py

(limited to 'text_recognizer/networks/vision_transformer.py')

diff --git a/text_recognizer/networks/vision_transformer.py b/text_recognizer/networks/vision_transformer.py
new file mode 100644
index 0000000..b617c71
--- /dev/null
+++ b/text_recognizer/networks/vision_transformer.py
@@ -0,0 +1,7 @@
+"""Vision transformer for character recognition."""
+from torch import nn, Tensor
+
+
+class VisionTransformer(nn.Module):
+    def __init__(self,) -> None:
+        pass
-- 
cgit v1.2.3-70-g09d2