blob: 904bd56b3edb25f28d200de847703b6b13a3fd35 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
|
# ConvNext network configuration.
# Each `_target_` is a dotted import path; mappings carrying one are presumably
# instantiated recursively by Hydra (`hydra.utils.instantiate`) -- TODO confirm
# against the loader that consumes this file.
_target_: text_recognizer.network.convnext.ConvNext
dim: 16
# One entry per stage; the three lists below all have length 3.
dim_mults: [2, 4, 8]
depths: [3, 3, 6]
downsampling_factors: [[2, 2], [2, 2], [2, 2]]
# Nested block passed to ConvNext as `attn`. Nesting is required: at top level
# these keys would collide with `_target_`/`dim` above and with each other.
attn:
  _target_: text_recognizer.network.convnext.TransformerBlock
  attn:
    _target_: text_recognizer.network.convnext.Attention
    # 128 == dim * dim_mults[-1] (16 * 8); presumably has to track the width of
    # the last stage -- verify before changing `dim` or `dim_mults`.
    dim: 128
    heads: 4
    dim_head: 64
    # NOTE(review): 8 == sqrt(dim_head); confirm how Attention applies `scale`.
    scale: 8
  ff:
    _target_: text_recognizer.network.convnext.FeedForward
    # Kept equal to the attention `dim` above.
    dim: 128
    mult: 4
|