sophia_opt.SophiaG
Browse files
scripts/pretrain-model.yaml
CHANGED
@@ -71,7 +71,7 @@ train:
|
|
71 |
micro_batch_size: 2
|
72 |
|
73 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
74 |
-
lr_warmup_steps:
|
75 |
|
76 |
# Number of epochs to train on (type: Optional[int], default: null)
|
77 |
epochs:
|
|
|
71 |
micro_batch_size: 2
|
72 |
|
73 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
74 |
+
lr_warmup_steps: 0
|
75 |
|
76 |
# Number of epochs to train on (type: Optional[int], default: null)
|
77 |
epochs:
|