sophia_opt.SophiaG
Browse files
scripts/pretrain-model.yaml
CHANGED
@@ -70,7 +70,7 @@ train:
|
|
70 |
|
71 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
72 |
# micro_batch_size: 2
|
73 |
-
micro_batch_size:
|
74 |
|
75 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
76 |
lr_warmup_steps: 2000
|
|
|
70 |
|
71 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
72 |
# micro_batch_size: 2
|
73 |
+
micro_batch_size: 4
|
74 |
|
75 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
76 |
lr_warmup_steps: 2000
|