diff options
author | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2023-09-11 22:15:26 +0200 |
---|---|---|
committer | Gustaf Rydholm <gustaf.rydholm@gmail.com> | 2023-09-11 22:15:26 +0200 |
commit | 56dc112cfb649217cd624b4ff305e2db83a383b7 (patch) | |
tree | 92555f27313f8bb4650a3d8dfa1c88ac6e1bfbf8 /training/conf/optimizer | |
parent | bece39632a83ef3c8c0f49c753cbc6110d2f78b9 (diff) |
Update configs
Diffstat (limited to 'training/conf/optimizer')
-rw-r--r-- | training/conf/optimizer/adamw.yaml | 5 | +++++ |
-rw-r--r-- | training/conf/optimizer/adan.yaml | 4 | ++++ |
-rw-r--r-- | training/conf/optimizer/lion.yaml | 5 | +++++ |
3 files changed, 14 insertions, 0 deletions
```diff
diff --git a/training/conf/optimizer/adamw.yaml b/training/conf/optimizer/adamw.yaml
new file mode 100644
index 0000000..568c67b
--- /dev/null
+++ b/training/conf/optimizer/adamw.yaml
@@ -0,0 +1,5 @@
+_target_: torch.optim.AdamW
+lr: 1.5e-4
+betas: [0.95, 0.98]
+weight_decay: 1.0e-2
+eps: 1.0e-6
diff --git a/training/conf/optimizer/adan.yaml b/training/conf/optimizer/adan.yaml
new file mode 100644
index 0000000..6950a86
--- /dev/null
+++ b/training/conf/optimizer/adan.yaml
@@ -0,0 +1,4 @@
+_target_: adan_pytorch.Adan
+lr: 2.0e-4
+betas: [0.02, 0.08, 0.01]
+weight_decay: 0.02
diff --git a/training/conf/optimizer/lion.yaml b/training/conf/optimizer/lion.yaml
new file mode 100644
index 0000000..cbf386a
--- /dev/null
+++ b/training/conf/optimizer/lion.yaml
@@ -0,0 +1,5 @@
+_target_: lion_pytorch.Lion
+lr: 5e-5
+betas: [0.95, 0.99]
+weight_decay: 0.1
+use_triton: true
```