---
# Experiment configuration: selects the loss, data loader, network, optimizer,
# LR scheduler and training settings by name, each paired with an `*_args`
# mapping of settings for it.
#
# NOTE(review): this file was recovered from a copy flattened onto one line.
# The nesting below is reconstructed from the sorted key order and the
# `*_args` naming; confirm it against the code that consumes this file.

criterion: CrossEntropyLoss
criterion_args:
  ignore_index: -100
  reduction: mean
  weight: null

data_loader_args:
  # Same value as train_args.batch_size; keep the two in sync.
  batch_size: 256
  cuda: true
  num_workers: 0
  sample_to_balance: true
  seed: 4711
  shuffle: true
  splits:
    - train
    - val
  subsample_fraction: null
  target_transform: null
  transform: null
dataloader: EmnistDataLoader

device: cuda:0

experiment_group: Sample Experiments

lr_scheduler: OneCycleLR
lr_scheduler_args:
  # Same value as train_args.epochs; keep the two in sync.
  epochs: 16
  max_lr: 0.0003
  steps_per_epoch: 1314

metrics:
  - accuracy

model: CharacterModel

network: MLP
network_args:
  input_size: 784
  num_layers: 3
  output_size: 62

optimizer: AdamW
optimizer_args:
  amsgrad: false
  betas:
    - 0.9
    - 0.999
  eps: 1.0e-08
  # NOTE(review): lr (0.0006) is larger than lr_scheduler_args.max_lr (0.0003).
  # Presumably the scheduler drives the effective rate; confirm this is
  # intended.
  lr: 0.0006
  weight_decay: 5.0e-05

train_args:
  batch_size: 256
  epochs: 16
  val_metric: accuracy