# VQVAE network configuration.
# `_target_` is the dotted import path of the class to build; the remaining
# keys are presumably forwarded as its constructor keyword arguments
# (Hydra-style instantiation) -- confirm against the consuming code.
_target_: text_recognizer.networks.vqvae.VQVAE
in_channels: 1
res_channels: 32
num_residual_layers: 2
embedding_dim: 64
num_embeddings: 512
decay: 0.99
activation: mish