Efficient net and non working transformer model.

author: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-04-25 23:32:50 +0200
committer: Gustaf Rydholm <gustaf.rydholm@gmail.com> 2021-04-25 23:32:50 +0200
commit: 9426cc794d8c28a65bbbf5ae5466a0a343078558 (patch)
tree: 44e31b0a7c58597d603ac29a693462aae4b6e9b0 /text_recognizer/networks/transformer/positional_encoding.py
parent: 4e60c836fb710baceba570c28c06437db3ad5c9b (diff)
1 files changed, 5 insertions, 1 deletions
diff --git a/text_recognizer/networks/transformer/positional_encoding.py b/text_recognizer/networks/transformer/positional_encoding.py
index 5874e97..c50afc3 100644
--- a/text_recognizer/networks/transformer/positional_encoding.py
+++ b/text_recognizer/networks/transformer/positional_encoding.py
@@ -33,7 +33,10 @@ class PositionalEncoding(nn.Module):
 
     def forward(self, x: Tensor) -> Tensor:
         """Encodes the tensor with a postional embedding."""
-        x = x + self.pe[:, : x.shape[1]]
+        # [T, B, D]
+        if x.shape[2] != self.pe.shape[2]:
+            raise ValueError(f"x shape does not match pe in the 3rd dim.")
+        x = x + self.pe[: x.shape[0]]
         return self.dropout(x)
 
 
@@ -48,6 +51,7 @@ class PositionalEncoding2D(nn.Module):
         pe = self.make_pe(hidden_dim, max_h, max_w)
         self.register_buffer("pe", pe)
 
+    @staticmethod
     def make_pe(hidden_dim: int, max_h: int, max_w: int) -> Tensor:
         """Returns 2d postional encoding."""
         pe_h = PositionalEncoding.make_pe(
author	Gustaf Rydholm <gustaf.rydholm@gmail.com>	2021-04-25 23:32:50 +0200
committer	Gustaf Rydholm <gustaf.rydholm@gmail.com>	2021-04-25 23:32:50 +0200
commit	9426cc794d8c28a65bbbf5ae5466a0a343078558 (patch)
tree	44e31b0a7c58597d603ac29a693462aae4b6e9b0 /text_recognizer/networks/transformer/positional_encoding.py
parent	4e60c836fb710baceba570c28c06437db3ad5c9b (diff)