AmberYifan commited on
Commit
f65c8f2
1 Parent(s): 96cd369

Training in progress, epoch 3, checkpoint

Browse files
last-checkpoint/global_step189/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73736d20e4b5078be3846f488716be6f8e377191d732f9dd074004b19b880cdb
3
+ size 13476836524
last-checkpoint/global_step189/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fff07b006b508703d293b537de80d632bb73464abe548b8db25000cf2ff7472a
3
+ size 13476836524
last-checkpoint/global_step189/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f396c83e2e063f7feaadcaa27cc4dfb30ac9e8f652e6ae84b91ae6a15c88c0
3
+ size 13476836524
last-checkpoint/global_step189/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c253541de0013ab57f2d4a91feadcdd9fa5668c6eaf3e583eefb06069b45689
3
+ size 13476836524
last-checkpoint/global_step189/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad6f8e38bd53cc02696fdd324acefc6450b408b94aa0efc4ff10b7c6725a66e
3
+ size 150693
last-checkpoint/global_step189/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2769a91ee3073096451825a14033196304aa61466a0742d138c51e7daf74827
3
+ size 150693
last-checkpoint/global_step189/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a1731958171867a7d85e560aa4daebfb823dbd70dd783e2e66bc88bb7340988
3
+ size 150693
last-checkpoint/global_step189/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65f5c3867311d6afda2cf705c7b21af911b58685f925c8915171e17d8ab9b14d
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step63
 
1
+ global_step189
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a18f906e422539d7561fb74fcbe4cda65c8dd8a58f49c0673740a6cbc3312e21
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95525d9c30b0213d4459f12201ac85cc3dcc181006ed5c82f4badf60c04d57c2
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b35678ee867b0ee73246f6cf7e43051df256f2bcc6845be8d2c0606598550c4
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae02f26857487c0ba98d339de83e4a15d2d435e050d87310ea9215f837474a82
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47ea9884ae8f8df38f905a0c4f62aecc15e57960dcee4e41334eb39453a817ac
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0fd6210a0d41e7f1f6251abc8cb58672cecda03d6cb318bd0e2a2023af05f6c
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1ce770862b76ceecb3453a5d0b9ef65311eab0f6a60f52997726a89d718de08
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab7cf0d34d60dfda516cf9661904550e2e294e723edd07c25c738f05e8ba92d1
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bcae6573442578b752be3e988d4ccb38056b45c31b5c02eb579ec6cebcfa62e
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7b183324e8227a51a9556d86b2ad893a8c4c52205ed4a737356c6611dac7353
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:398ff45072fee2975e88b9e078f915103d75d94bc08753303cf855b915973623
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac69e994090f4818cb1fa6f6cefa363178552c3c731c6507ff195bcb07fd5bef
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f4b210bc832d4c648e3bee8c21dca26e5a8b365d6ec90c638062005a052e57b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f68e61b63402f8afb1f69c960f7944965655dac11e3ccf29919c282f23931f86
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:845f8eea760ff90e22dadf5fb7f80c9079f8c2298a8770c5d4c3b3309b38a6ef
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c988df4a306242fbc45c908424c576078313f1b5bb472bee13c3b6371b94095e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 63,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -128,6 +128,218 @@
128
  "eval_samples_per_second": 16.341,
129
  "eval_steps_per_second": 0.572,
130
  "step": 63
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
131
  }
132
  ],
133
  "logging_steps": 10,
@@ -142,7 +354,7 @@
142
  "should_evaluate": false,
143
  "should_log": false,
144
  "should_save": true,
145
- "should_training_stop": false
146
  },
147
  "attributes": {}
148
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 189,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
128
  "eval_samples_per_second": 16.341,
129
  "eval_steps_per_second": 0.572,
130
  "step": 63
131
+ },
132
+ {
133
+ "epoch": 1.1111111111111112,
134
+ "grad_norm": 13.062522185911641,
135
+ "learning_rate": 3.5e-07,
136
+ "logits/chosen": -1.375,
137
+ "logits/rejected": -1.375,
138
+ "logps/chosen": -93.0,
139
+ "logps/rejected": -108.0,
140
+ "loss": 0.5617,
141
+ "rewards/accuracies": 0.7250000238418579,
142
+ "rewards/chosen": 0.1533203125,
143
+ "rewards/margins": 0.375,
144
+ "rewards/rejected": -0.220703125,
145
+ "step": 70
146
+ },
147
+ {
148
+ "epoch": 1.2698412698412698,
149
+ "grad_norm": 12.793133064546527,
150
+ "learning_rate": 3.205882352941177e-07,
151
+ "logits/chosen": -1.2421875,
152
+ "logits/rejected": -1.359375,
153
+ "logps/chosen": -82.5,
154
+ "logps/rejected": -112.5,
155
+ "loss": 0.5127,
156
+ "rewards/accuracies": 0.7749999761581421,
157
+ "rewards/chosen": 0.1455078125,
158
+ "rewards/margins": 0.515625,
159
+ "rewards/rejected": -0.37109375,
160
+ "step": 80
161
+ },
162
+ {
163
+ "epoch": 1.4285714285714286,
164
+ "grad_norm": 13.067935081505256,
165
+ "learning_rate": 2.911764705882353e-07,
166
+ "logits/chosen": -1.484375,
167
+ "logits/rejected": -1.3203125,
168
+ "logps/chosen": -100.0,
169
+ "logps/rejected": -98.0,
170
+ "loss": 0.5069,
171
+ "rewards/accuracies": 0.7875000238418579,
172
+ "rewards/chosen": 0.283203125,
173
+ "rewards/margins": 0.5390625,
174
+ "rewards/rejected": -0.2578125,
175
+ "step": 90
176
+ },
177
+ {
178
+ "epoch": 1.5873015873015874,
179
+ "grad_norm": 15.317610443936815,
180
+ "learning_rate": 2.6176470588235295e-07,
181
+ "logits/chosen": -1.3671875,
182
+ "logits/rejected": -1.375,
183
+ "logps/chosen": -90.0,
184
+ "logps/rejected": -111.0,
185
+ "loss": 0.4966,
186
+ "rewards/accuracies": 0.762499988079071,
187
+ "rewards/chosen": 0.2353515625,
188
+ "rewards/margins": 0.5546875,
189
+ "rewards/rejected": -0.318359375,
190
+ "step": 100
191
+ },
192
+ {
193
+ "epoch": 1.746031746031746,
194
+ "grad_norm": 12.447441760307086,
195
+ "learning_rate": 2.323529411764706e-07,
196
+ "logits/chosen": -1.4296875,
197
+ "logits/rejected": -1.296875,
198
+ "logps/chosen": -97.0,
199
+ "logps/rejected": -115.0,
200
+ "loss": 0.4934,
201
+ "rewards/accuracies": 0.887499988079071,
202
+ "rewards/chosen": 0.1435546875,
203
+ "rewards/margins": 0.56640625,
204
+ "rewards/rejected": -0.423828125,
205
+ "step": 110
206
+ },
207
+ {
208
+ "epoch": 1.9047619047619047,
209
+ "grad_norm": 13.19848987425151,
210
+ "learning_rate": 2.0294117647058823e-07,
211
+ "logits/chosen": -1.34375,
212
+ "logits/rejected": -1.34375,
213
+ "logps/chosen": -94.0,
214
+ "logps/rejected": -117.5,
215
+ "loss": 0.4805,
216
+ "rewards/accuracies": 0.8500000238418579,
217
+ "rewards/chosen": 0.10205078125,
218
+ "rewards/margins": 0.60546875,
219
+ "rewards/rejected": -0.50390625,
220
+ "step": 120
221
+ },
222
+ {
223
+ "epoch": 2.0,
224
+ "eval_logits/chosen": -1.34375,
225
+ "eval_logits/rejected": -1.328125,
226
+ "eval_logps/chosen": -92.0,
227
+ "eval_logps/rejected": -113.0,
228
+ "eval_loss": 0.5889843702316284,
229
+ "eval_rewards/accuracies": 0.6428571343421936,
230
+ "eval_rewards/chosen": -0.0751953125,
231
+ "eval_rewards/margins": 0.31640625,
232
+ "eval_rewards/rejected": -0.392578125,
233
+ "eval_runtime": 14.7924,
234
+ "eval_samples_per_second": 13.52,
235
+ "eval_steps_per_second": 0.473,
236
+ "step": 126
237
+ },
238
+ {
239
+ "epoch": 2.0634920634920633,
240
+ "grad_norm": 10.98673276740895,
241
+ "learning_rate": 1.7352941176470587e-07,
242
+ "logits/chosen": -1.390625,
243
+ "logits/rejected": -1.3984375,
244
+ "logps/chosen": -101.0,
245
+ "logps/rejected": -116.0,
246
+ "loss": 0.4562,
247
+ "rewards/accuracies": 0.862500011920929,
248
+ "rewards/chosen": 0.193359375,
249
+ "rewards/margins": 0.67578125,
250
+ "rewards/rejected": -0.482421875,
251
+ "step": 130
252
+ },
253
+ {
254
+ "epoch": 2.2222222222222223,
255
+ "grad_norm": 9.416416295176981,
256
+ "learning_rate": 1.441176470588235e-07,
257
+ "logits/chosen": -1.4140625,
258
+ "logits/rejected": -1.3828125,
259
+ "logps/chosen": -100.5,
260
+ "logps/rejected": -107.5,
261
+ "loss": 0.4104,
262
+ "rewards/accuracies": 0.862500011920929,
263
+ "rewards/chosen": 0.2099609375,
264
+ "rewards/margins": 0.76171875,
265
+ "rewards/rejected": -0.55078125,
266
+ "step": 140
267
+ },
268
+ {
269
+ "epoch": 2.380952380952381,
270
+ "grad_norm": 11.858508121730686,
271
+ "learning_rate": 1.1470588235294116e-07,
272
+ "logits/chosen": -1.3671875,
273
+ "logits/rejected": -1.3515625,
274
+ "logps/chosen": -93.5,
275
+ "logps/rejected": -113.5,
276
+ "loss": 0.413,
277
+ "rewards/accuracies": 0.8999999761581421,
278
+ "rewards/chosen": 0.2177734375,
279
+ "rewards/margins": 0.7265625,
280
+ "rewards/rejected": -0.51171875,
281
+ "step": 150
282
+ },
283
+ {
284
+ "epoch": 2.5396825396825395,
285
+ "grad_norm": 9.556697117699082,
286
+ "learning_rate": 8.529411764705883e-08,
287
+ "logits/chosen": -1.296875,
288
+ "logits/rejected": -1.4296875,
289
+ "logps/chosen": -90.5,
290
+ "logps/rejected": -108.5,
291
+ "loss": 0.4203,
292
+ "rewards/accuracies": 0.800000011920929,
293
+ "rewards/chosen": 0.1337890625,
294
+ "rewards/margins": 0.82421875,
295
+ "rewards/rejected": -0.69140625,
296
+ "step": 160
297
+ },
298
+ {
299
+ "epoch": 2.6984126984126986,
300
+ "grad_norm": 10.065550572065934,
301
+ "learning_rate": 5.5882352941176474e-08,
302
+ "logits/chosen": -1.3671875,
303
+ "logits/rejected": -1.3671875,
304
+ "logps/chosen": -98.5,
305
+ "logps/rejected": -109.5,
306
+ "loss": 0.4442,
307
+ "rewards/accuracies": 0.7749999761581421,
308
+ "rewards/chosen": 0.09814453125,
309
+ "rewards/margins": 0.734375,
310
+ "rewards/rejected": -0.63671875,
311
+ "step": 170
312
+ },
313
+ {
314
+ "epoch": 2.857142857142857,
315
+ "grad_norm": 11.316830865980743,
316
+ "learning_rate": 2.6470588235294116e-08,
317
+ "logits/chosen": -1.3515625,
318
+ "logits/rejected": -1.34375,
319
+ "logps/chosen": -102.0,
320
+ "logps/rejected": -104.5,
321
+ "loss": 0.4264,
322
+ "rewards/accuracies": 0.762499988079071,
323
+ "rewards/chosen": 0.10498046875,
324
+ "rewards/margins": 0.6328125,
325
+ "rewards/rejected": -0.52734375,
326
+ "step": 180
327
+ },
328
+ {
329
+ "epoch": 3.0,
330
+ "eval_logits/chosen": -1.3515625,
331
+ "eval_logits/rejected": -1.3359375,
332
+ "eval_logps/chosen": -92.5,
333
+ "eval_logps/rejected": -114.0,
334
+ "eval_loss": 0.5811718702316284,
335
+ "eval_rewards/accuracies": 0.6428571343421936,
336
+ "eval_rewards/chosen": -0.1357421875,
337
+ "eval_rewards/margins": 0.34765625,
338
+ "eval_rewards/rejected": -0.484375,
339
+ "eval_runtime": 14.7749,
340
+ "eval_samples_per_second": 13.537,
341
+ "eval_steps_per_second": 0.474,
342
+ "step": 189
343
  }
344
  ],
345
  "logging_steps": 10,
 
354
  "should_evaluate": false,
355
  "should_log": false,
356
  "should_save": true,
357
+ "should_training_stop": true
358
  },
359
  "attributes": {}
360
  }