diff options
Diffstat (limited to 'training/conf/network')
-rw-r--r-- | training/conf/network/decoder/vae_decoder.yaml | 4 | ||||
-rw-r--r-- | training/conf/network/encoder/vae_encoder.yaml | 4 | ||||
-rw-r--r-- | training/conf/network/vqvae.yaml | 2 |
3 files changed, 7 insertions, 3 deletions
diff --git a/training/conf/network/decoder/vae_decoder.yaml b/training/conf/network/decoder/vae_decoder.yaml
index 8b5502d..aed5733 100644
--- a/training/conf/network/decoder/vae_decoder.yaml
+++ b/training/conf/network/decoder/vae_decoder.yaml
@@ -1,7 +1,9 @@
 _target_: text_recognizer.networks.vqvae.decoder.Decoder
 out_channels: 1
 hidden_dim: 32
-channels_multipliers: [4, 4, 2, 1]
+channels_multipliers: [4, 2, 1]
 dropout_rate: 0.0
 activation: mish
 use_norm: true
+num_residuals: 4
+residual_channels: 32
diff --git a/training/conf/network/encoder/vae_encoder.yaml b/training/conf/network/encoder/vae_encoder.yaml
index 33ae0b9..5d39bf7 100644
--- a/training/conf/network/encoder/vae_encoder.yaml
+++ b/training/conf/network/encoder/vae_encoder.yaml
@@ -1,7 +1,9 @@
 _target_: text_recognizer.networks.vqvae.encoder.Encoder
 in_channels: 1
 hidden_dim: 32
-channels_multipliers: [1, 2, 4, 4]
+channels_multipliers: [1, 2, 4]
 dropout_rate: 0.0
 activation: mish
 use_norm: true
+num_residuals: 4
+residual_channels: 32
diff --git a/training/conf/network/vqvae.yaml b/training/conf/network/vqvae.yaml
index d97e9b6..8210f04 100644
--- a/training/conf/network/vqvae.yaml
+++ b/training/conf/network/vqvae.yaml
@@ -5,5 +5,5 @@ defaults:
 _target_: text_recognizer.networks.vqvae.vqvae.VQVAE
 hidden_dim: 128
 embedding_dim: 32
-num_embeddings: 1024
+num_embeddings: 8192
 decay: 0.99