lvwerra HF Staff committed on
Commit
cd6f029
·
1 Parent(s): e3d9b66
Files changed (1) hide show
  1. codeparrot_training.py +3 -3
codeparrot_training.py CHANGED
@@ -123,11 +123,11 @@ config = {"train_batch_size": 12,
123
  "lr_scheduler_type": "cosine",
124
  "num_warmup_steps": 2000,
125
  "gradient_accumulation_steps": 1,
126
- "max_train_steps": 8192,
127
- "max_eval_steps": 512,
128
  "seq_length": 1024,
129
  "seed": 1,
130
- "save_checkpoint_steps":512,}
131
  args = Namespace(**config)
132
  set_seed(args.seed)
133
 
 
123
  "lr_scheduler_type": "cosine",
124
  "num_warmup_steps": 2000,
125
  "gradient_accumulation_steps": 1,
126
+ "max_train_steps": 150_000,
127
+ "max_eval_steps": -1,
128
  "seq_length": 1024,
129
  "seed": 1,
130
+ "save_checkpoint_steps": 15_000}
131
  args = Namespace(**config)
132
  set_seed(args.seed)
133