From 240f5e9f20032e82515fa66ce784619527d1041e Mon Sep 17 00:00:00 2001 From: Gustaf Rydholm Date: Sun, 8 Aug 2021 19:59:55 +0200 Subject: Add VQGAN and loss function --- training/conf/network/decoder/pixelcnn_decoder.yaml | 5 +++++ training/conf/network/decoder/pixelcnn_encoder.yaml | 5 ----- training/conf/network/decoder/vae_decoder.yaml | 2 +- 3 files changed, 6 insertions(+), 6 deletions(-) create mode 100644 training/conf/network/decoder/pixelcnn_decoder.yaml delete mode 100644 training/conf/network/decoder/pixelcnn_encoder.yaml (limited to 'training/conf/network/decoder') diff --git a/training/conf/network/decoder/pixelcnn_decoder.yaml b/training/conf/network/decoder/pixelcnn_decoder.yaml new file mode 100644 index 0000000..cdddb7a --- /dev/null +++ b/training/conf/network/decoder/pixelcnn_decoder.yaml @@ -0,0 +1,5 @@ +_target_: text_recognizer.networks.vqvae.pixelcnn.Decoder +out_channels: 1 +hidden_dim: 8 +channels_multipliers: [8, 2, 1] +dropout_rate: 0.25 diff --git a/training/conf/network/decoder/pixelcnn_encoder.yaml b/training/conf/network/decoder/pixelcnn_encoder.yaml deleted file mode 100644 index 47a130d..0000000 --- a/training/conf/network/decoder/pixelcnn_encoder.yaml +++ /dev/null @@ -1,5 +0,0 @@ -_target_: text_recognizer.networks.vqvae.pixelcnn.Encoder -in_channels: 1 -hidden_dim: 8 -channels_multipliers: [1, 2, 8, 8] -dropout_rate: 0.25 diff --git a/training/conf/network/decoder/vae_decoder.yaml b/training/conf/network/decoder/vae_decoder.yaml index 0a36a54..a5e7286 100644 --- a/training/conf/network/decoder/vae_decoder.yaml +++ b/training/conf/network/decoder/vae_decoder.yaml @@ -1,5 +1,5 @@ _target_: text_recognizer.networks.vqvae.decoder.Decoder out_channels: 1 hidden_dim: 32 -channels_multipliers: [4, 4, 2, 1] +channels_multipliers: [8, 8, 4, 1] dropout_rate: 0.25 -- cgit v1.2.3-70-g09d2