# path: root/training/conf/network/vqvae.yaml
# blob: 22f786f7527016bcad7eb1677f14ae292c6c932b
# Network configuration for the VQVAE model.
# NOTE(review): the `defaults` list and the `_target_` keys look like Hydra
# conventions (config composition / object instantiation) -- confirm against
# the code that loads this file.

# Selects the `vae_encoder` and `vae_decoder` options for the encoder and
# decoder entries; those configs are defined outside this file.
defaults:
  - encoder: vae_encoder
  - decoder: vae_decoder

# Dotted path of the model class this config describes.
_target_: text_recognizer.networks.vqvae.vqvae.VQVAE
# Settings for the vector quantizer component.
quantizer:
  _target_: text_recognizer.networks.quantizer.quantizer.VectorQuantizer
  # NOTE(review): presumably the feature width coming out of the encoder --
  # verify against the vae_encoder config.
  input_dim: 128
  # Nested codebook object handed to the quantizer.
  codebook:
    _target_: text_recognizer.networks.quantizer.codebook.CosineSimilarityCodebook
    # NOTE(review): presumably the size of each code vector (dim) and the
    # number of codes (codebook_size) -- confirm in the codebook class.
    dim: 8
    codebook_size: 512
    # NOTE(review): presumably enables k-means initialisation of the codes,
    # run for `kmeans_iters` iterations -- confirm.
    kmeans_init: true
    kmeans_iters: 10
    # NOTE(review): presumably a moving-average decay rate for code updates
    # and a small numerical-stability constant -- confirm.
    decay: 0.8
    eps: 1.0e-5
    # NOTE(review): presumably the usage threshold below which a code is
    # treated as dead -- confirm.
    threshold_dead: 2
  # NOTE(review): presumably the weight of the commitment loss term -- confirm.
  commitment: 1.0