---
# Experiment configuration for one training run.
#
# Layout: each component is chosen by name (criterion, dataloader,
# lr_scheduler, model, network, optimizer) and is accompanied by a
# matching `*_args` mapping holding that component's settings.
#
# NOTE(review): this file was reconstructed from a copy in which all
# line breaks had been lost. The nesting below follows the `*_args`
# naming and the alphabetical key order of the flattened text; confirm
# it against the code that consumes this config.

# Loss function, selected by name, and its settings.
criterion: CrossEntropyLoss
criterion_args:
  ignore_index: -100
  reduction: mean
  weight: null

# Settings for the data loader named by `dataloader` below.
data_loader_args:
  batch_size: 256
  cuda: true
  num_workers: 8
  sample_to_balance: true
  seed: 4711
  shuffle: true
  splits:
    - train
    - val
  subsample_fraction: null
  target_transform: null
  transform: null
dataloader: EmnistDataLoader

# Quoted so the embedded colon can never be misread by a parser.
device: 'cuda:0'

experiment_group: Sample Experiments

# Learning-rate scheduler, selected by name, and its settings.
# NOTE(review): `epochs` repeats train_args.epochs, and
# `steps_per_epoch` is a hard-coded count; presumably both must be
# kept in sync with the dataset size and batch size - confirm.
lr_scheduler: OneCycleLR
lr_scheduler_args:
  epochs: 16
  max_lr: 0.001
  steps_per_epoch: 1314

metrics:
  - accuracy

# Model wrapper and the network it uses, with the network's settings.
model: CharacterModel
network: MLP
network_args:
  input_size: 784
  num_layers: 3
  output_size: 62

# Optimizer, selected by name, and its settings.
# NOTE(review): `lr` (0.01) is larger than lr_scheduler_args.max_lr
# (0.001); verify which of the two the training code actually uses.
optimizer: AdamW
optimizer_args:
  amsgrad: false
  betas:
    - 0.9
    - 0.999
  eps: 1.0e-08
  lr: 0.01
  weight_decay: 0

resume_experiment: null

# Trainer settings.
# NOTE(review): `batch_size` repeats data_loader_args.batch_size.
# `val_metric` is placed here on the assumption that it is a trainer
# setting; the flattened original does not show its nesting - confirm.
train_args:
  batch_size: 256
  epochs: 16
  val_metric: accuracy

# NOTE(review): placed at the top level on the assumption that it is a
# run-wide setting; it may instead belong under `train_args` - confirm.
verbosity: 2