diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-10-02 02:55:00 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-10-02 02:55:00 +0200 |
commit | 7d06b7a23fb6340bdf2d2ddee0941ae8c8ee4217 (patch) | |
tree | 4c07ab7eff44021a2717af47400781cdcc74c576 | |
parent | 20b851f1918bcfc122edd1161a33fd496f82ee86 (diff) |
Add sweep conf
-rw-r--r-- | training/conf/sweep/conv_transformer.yaml | 29 |
1 files changed, 29 insertions, 0 deletions
```diff
diff --git a/training/conf/sweep/conv_transformer.yaml b/training/conf/sweep/conv_transformer.yaml
new file mode 100644
index 0000000..70e0a56
--- /dev/null
+++ b/training/conf/sweep/conv_transformer.yaml
@@ -0,0 +1,29 @@
+# @package _global_
+
+# Example:
+# python main.py -m sweep=lines experiment=conv_transformer_lines
+
+defaults:
+  - override /hydra/sweeper: optuna
+
+optimized_metric: train/loss
+
+hydra:
+  mode: "MULTIRUN"
+  sweeper:
+    _target_: hydra_plugins.hydra_optuna_sweeper.optuna_sweeper.OptunaSweeper
+    storage: null
+    study_name: null
+    n_jobs: 1
+    direction: minimize
+    n_trials: 20
+    sampler:
+      _target_: optuna.samplers.TPESampler
+      seed: 4711
+      n_startup_trials: 5
+
+    params:
+      # optimizer: interval(0.0003, 0.001)
+      network.decoder.decoder.depth: choice(4, 8, 10)
+      network.decoder.decoder.block.self_attn.num_heads: choice(4, 6, 8)
+      network.decoder.decoder.block.cross_attn.num_heads: choice(6, 8, 12)
```