pretrain 1
Browse files
scripts/pretrain_core_model_1.yaml
CHANGED
@@ -85,7 +85,7 @@ train:
|
|
85 |
max_norm: 1.0
|
86 |
|
87 |
# (type: float, default: 4e-05)
|
88 |
-
min_lr:
|
89 |
|
90 |
# Evaluation-related arguments. See ``litgpt.args.EvalArgs`` for details
|
91 |
eval:
|
@@ -125,7 +125,7 @@ eval:
|
|
125 |
optimizer:
|
126 |
class_path: sophia_opt.SophiaG
|
127 |
init_args:
|
128 |
-
lr:
|
129 |
betas:
|
130 |
- 0.9
|
131 |
- 0.95
|
|
|
85 |
max_norm: 1.0
|
86 |
|
87 |
# (type: float, default: 4e-05)
|
88 |
+
min_lr: 5e-5
|
89 |
|
90 |
# Evaluation-related arguments. See ``litgpt.args.EvalArgs`` for details
|
91 |
eval:
|
|
|
125 |
optimizer:
|
126 |
class_path: sophia_opt.SophiaG
|
127 |
init_args:
|
128 |
+
lr: 1e-4
|
129 |
betas:
|
130 |
- 0.9
|
131 |
- 0.95
|