diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2021-08-06 02:42:45 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2021-08-06 02:42:45 +0200 |
commit | 3ab82ad36bce6fa698a13a029a0694b75a5947b7 (patch) | |
tree | 136f71a62d60e3ccf01e1f95d64bb4d9f9c9befe /training/conf/network | |
parent | 1bccf71cf4eec335001b50a8fbc0c991d0e6d13a (diff) |
Fix VQVAE into en/decoder, bug in wandb artifact code uploading
Diffstat (limited to 'training/conf/network')
-rw-r--r-- | training/conf/network/decoder/pixelcnn_encoder.yaml | 5 | ||||
-rw-r--r-- | training/conf/network/decoder/vae_decoder.yaml | 5 | ||||
-rw-r--r-- | training/conf/network/encoder/pixelcnn_decoder.yaml | 5 | ||||
-rw-r--r-- | training/conf/network/encoder/vae_encoder.yaml | 5 | ||||
-rw-r--r-- | training/conf/network/vqvae.yaml | 15 | ||||
-rw-r--r-- | training/conf/network/vqvae_pixelcnn.yaml | 9 |
6 files changed, 37 insertions, 7 deletions
```diff
diff --git a/training/conf/network/decoder/pixelcnn_encoder.yaml b/training/conf/network/decoder/pixelcnn_encoder.yaml
new file mode 100644
index 0000000..47a130d
--- /dev/null
+++ b/training/conf/network/decoder/pixelcnn_encoder.yaml
@@ -0,0 +1,5 @@
+_target_: text_recognizer.networks.vqvae.pixelcnn.Encoder
+in_channels: 1
+hidden_dim: 8
+channels_multipliers: [1, 2, 8, 8]
+dropout_rate: 0.25
diff --git a/training/conf/network/decoder/vae_decoder.yaml b/training/conf/network/decoder/vae_decoder.yaml
new file mode 100644
index 0000000..b2090b3
--- /dev/null
+++ b/training/conf/network/decoder/vae_decoder.yaml
@@ -0,0 +1,5 @@
+_target_: text_recognizer.networks.vqvae.decoder.Decoder
+out_channels: 1
+hidden_dim: 32
+channels_multipliers: [8, 6, 2, 1]
+dropout_rate: 0.25
diff --git a/training/conf/network/encoder/pixelcnn_decoder.yaml b/training/conf/network/encoder/pixelcnn_decoder.yaml
new file mode 100644
index 0000000..3895164
--- /dev/null
+++ b/training/conf/network/encoder/pixelcnn_decoder.yaml
@@ -0,0 +1,5 @@
+_target_: text_recognizer.networks.vqvae.pixelcnn.Decoder
+out_channels: 1
+hidden_dim: 8
+channels_multipliers: [8, 8, 2, 1]
+dropout_rate: 0.25
diff --git a/training/conf/network/encoder/vae_encoder.yaml b/training/conf/network/encoder/vae_encoder.yaml
new file mode 100644
index 0000000..5dc6814
--- /dev/null
+++ b/training/conf/network/encoder/vae_encoder.yaml
@@ -0,0 +1,5 @@
+_target_: text_recognizer.networks.vqvae.encoder.Encoder
+in_channels: 1
+hidden_dim: 32
+channels_multipliers: [1, 2, 6, 8]
+dropout_rate: 0.25
diff --git a/training/conf/network/vqvae.yaml b/training/conf/network/vqvae.yaml
index 5a5c066..835d0b7 100644
--- a/training/conf/network/vqvae.yaml
+++ b/training/conf/network/vqvae.yaml
@@ -1,8 +1,9 @@
-_target_: text_recognizer.networks.vqvae.VQVAE
-in_channels: 1
-res_channels: 32
-num_residual_layers: 2
-embedding_dim: 64
-num_embeddings: 512
+defaults:
+  - encoder: vae_encoder
+  - decoder: vae_decoder
+
+_target_: text_recognizer.networks.vqvae.vqvae.VQVAE
+hidden_dim: 256
+embedding_dim: 32
+num_embeddings: 1024
 decay: 0.99
-activation: mish
diff --git a/training/conf/network/vqvae_pixelcnn.yaml b/training/conf/network/vqvae_pixelcnn.yaml
new file mode 100644
index 0000000..10200bc
--- /dev/null
+++ b/training/conf/network/vqvae_pixelcnn.yaml
@@ -0,0 +1,9 @@
+defaults:
+  - encoder: pixelcnn_encoder
+  - decoder: pixelcnn_decoder
+
+_target_: text_recognizer.networks.vqvae.vqvae.VQVAE
+hidden_dim: 64
+embedding_dim: 32
+num_embeddings: 512
+decay: 0.99
```