# path: root/training/conf/network/convnext.yaml
# blob: 63ad424cc8889dad2419786991852d5378d390d5
# Network configuration for the ConvNext model.
# Each `_target_` value is a dotted path to a class; the sibling keys are
# presumably passed to that class as constructor arguments (Hydra-style
# instantiation) -- confirm against the code that loads this file.
_target_: text_recognizer.networks.convnext.ConvNext
# NOTE(review): looks like the base channel width that `dim_mults` scales;
# confirm in ConvNext.
dim: 16
# `dim_mults`, `depths` and `downsampling_factors` each have three entries,
# presumably one per stage -- keep their lengths in sync when editing.
dim_mults: [2, 4, 8]
depths: [3, 3, 6]
downsampling_factors: [[2, 2], [2, 2], [2, 2]]
# Nested TransformerBlock config, itself composed of an attention config
# (`attn`) and a feed-forward config (`ff`).
attn:
  _target_: text_recognizer.networks.convnext.TransformerBlock
  attn:
    _target_: text_recognizer.networks.convnext.Attention
    # 128 == dim * dim_mults[-1] (16 * 8); assumes this must equal the
    # width of the last ConvNext stage -- TODO confirm and update together.
    dim: 128
    heads: 4
    dim_head: 64
    # NOTE(review): the meaning of `scale` is defined by the Attention class,
    # which is not visible here -- check it before changing this value.
    scale: 8
  ff:
    _target_: text_recognizer.networks.convnext.FeedForward
    # Same value as the attention `dim` above; presumably they must agree.
    dim: 128
    mult: 4