mtasic85 committed on
Commit
11df753
1 Parent(s): d15ab91

sophia_opt.SophiaG

Browse files
Files changed (1) hide show
  1. scripts/pretrain-model.yaml +1 -1
scripts/pretrain-model.yaml CHANGED
@@ -70,7 +70,7 @@ train:
70
 
71
  # Number of samples per data-parallel rank (type: int, default: 4)
72
  # micro_batch_size: 2
73
- micro_batch_size: 5
74
 
75
  # Number of iterations with learning rate warmup active (type: int, default: 2000)
76
  lr_warmup_steps: 2000
 
70
 
71
  # Number of samples per data-parallel rank (type: int, default: 4)
72
  # micro_batch_size: 2
73
+ micro_batch_size: 4
74
 
75
  # Number of iterations with learning rate warmup active (type: int, default: 2000)
76
  lr_warmup_steps: 2000