summary | refs | log | tree | commit | diff
path: root/training/conf/optimizer
diff options
context:
space:
mode:
author Gustaf Rydholm <gustaf.rydholm@gmail.com> 2023-09-11 22:15:26 +0200
committer Gustaf Rydholm <gustaf.rydholm@gmail.com> 2023-09-11 22:15:26 +0200
commit 56dc112cfb649217cd624b4ff305e2db83a383b7 (patch)
tree 92555f27313f8bb4650a3d8dfa1c88ac6e1bfbf8 /training/conf/optimizer
parent bece39632a83ef3c8c0f49c753cbc6110d2f78b9 (diff)
Update configs
Diffstat (limited to 'training/conf/optimizer')
-rw-r--r-- training/conf/optimizer/adamw.yaml 5
-rw-r--r-- training/conf/optimizer/adan.yaml 4
-rw-r--r-- training/conf/optimizer/lion.yaml 5
3 files changed, 14 insertions, 0 deletions
diff --git a/training/conf/optimizer/adamw.yaml b/training/conf/optimizer/adamw.yaml
new file mode 100644
index 0000000..568c67b
--- /dev/null
+++ b/training/conf/optimizer/adamw.yaml
@@ -0,0 +1,5 @@
+_target_: torch.optim.AdamW
+lr: 1.5e-4
+betas: [0.95, 0.98]
+weight_decay: 1.0e-2
+eps: 1.0e-6
diff --git a/training/conf/optimizer/adan.yaml b/training/conf/optimizer/adan.yaml
new file mode 100644
index 0000000..6950a86
--- /dev/null
+++ b/training/conf/optimizer/adan.yaml
@@ -0,0 +1,4 @@
+_target_: adan_pytorch.Adan
+lr: 2.0e-4
+betas: [0.02, 0.08, 0.01]
+weight_decay: 0.02
diff --git a/training/conf/optimizer/lion.yaml b/training/conf/optimizer/lion.yaml
new file mode 100644
index 0000000..cbf386a
--- /dev/null
+++ b/training/conf/optimizer/lion.yaml
@@ -0,0 +1,5 @@
+_target_: lion_pytorch.Lion
+lr: 5e-5
+betas: [0.95, 0.99]
+weight_decay: 0.1
+use_triton: true