diff options
| author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-10-02 02:55:00 +0200 | 
|---|---|---|
| committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2022-10-02 02:55:00 +0200 | 
| commit | 7d06b7a23fb6340bdf2d2ddee0941ae8c8ee4217 (patch) | |
| tree | 4c07ab7eff44021a2717af47400781cdcc74c576 /training/conf | |
| parent | 20b851f1918bcfc122edd1161a33fd496f82ee86 (diff) | |
Add sweep conf
Diffstat (limited to 'training/conf')
| -rw-r--r-- | training/conf/sweep/conv_transformer.yaml | 29 | 
1 files changed, 29 insertions, 0 deletions
diff --git a/training/conf/sweep/conv_transformer.yaml b/training/conf/sweep/conv_transformer.yaml new file mode 100644 index 0000000..70e0a56 --- /dev/null +++ b/training/conf/sweep/conv_transformer.yaml @@ -0,0 +1,29 @@ +# @package _global_ + +# Example: +# python main.py -m sweep=conv_transformer experiment=conv_transformer_lines + +defaults: +  - override /hydra/sweeper: optuna + +optimized_metric: train/loss + +hydra: +  mode: "MULTIRUN" +  sweeper: +    _target_: hydra_plugins.hydra_optuna_sweeper.optuna_sweeper.OptunaSweeper +    storage: null +    study_name: null +    n_jobs: 1 +    direction: minimize +    n_trials: 20 +    sampler: +      _target_: optuna.samplers.TPESampler +      seed: 4711 +      n_startup_trials: 5 + +    params: +      # optimizer: interval(0.0003, 0.001) +      network.decoder.decoder.depth: choice(4, 8, 10) +      network.decoder.decoder.block.self_attn.num_heads: choice(4, 6, 8) +      network.decoder.decoder.block.cross_attn.num_heads: choice(6, 8, 12)  |