pilotj committed on
Commit
714e98e
·
verified ·
1 Parent(s): f07885d

Training in progress, step 5500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7769a8b409b9f5cc8c4fcca71fea9c10feaff3ae5f6eda49319a9524c31c745
3
  size 498686648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9900b3c186c079bcb23fca4d7455eb1c1fa4a6834aa080210c16cf89ed37cf6a
3
  size 498686648
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf482bdae897d5287fa2e8b439dcd2c6189371c6a214d2ce6b7eba7aa13fa0f0
3
  size 997493050
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79da3e9caf7d4d2e6f1dcc2334761728f64c3e8f0ede33e99992bae602b52fc1
3
  size 997493050
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee729c95a8d92e4810522cb347750f57fd0b0ec5c06f7992ee2be85d4a78ab4b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:721bc7a5b221d6b012d2388a6a09216865e2462e31bd2e0fe77aaddae689aeb6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65c4d3964df52c8d20548263cfeb8b6c3ec321803a92f2244badb7ff92803145
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e27a97977fcc445cdd5c99153117efc644690cb82cdc8080515d4ff3a8dec66
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.4090208411216736,
3
  "best_model_checkpoint": "results/checkpoint-5000",
4
- "epoch": 0.948136910969944,
5
  "eval_steps": 500,
6
- "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -207,6 +207,26 @@
207
  "eval_samples_per_second": 57.28,
208
  "eval_steps_per_second": 0.45,
209
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
210
  }
211
  ],
212
  "logging_steps": 500,
@@ -226,7 +246,7 @@
226
  "attributes": {}
227
  }
228
  },
229
- "total_flos": 1.6842736140288e+17,
230
  "train_batch_size": 32,
231
  "trial_name": null,
232
  "trial_params": null
 
1
  {
2
  "best_metric": 0.4090208411216736,
3
  "best_model_checkpoint": "results/checkpoint-5000",
4
+ "epoch": 1.0429506020669386,
5
  "eval_steps": 500,
6
+ "global_step": 5500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
207
  "eval_samples_per_second": 57.28,
208
  "eval_steps_per_second": 0.45,
209
  "step": 5000
210
+ },
211
+ {
212
+ "epoch": 1.0429506020669386,
213
+ "grad_norm": 298623.21875,
214
+ "learning_rate": 9.569505025602126e-06,
215
+ "loss": 0.4332,
216
+ "step": 5500
217
+ },
218
+ {
219
+ "epoch": 1.0429506020669386,
220
+ "eval_accuracy": 0.8806597822531658,
221
+ "eval_f1_macro": 0.8501793427912383,
222
+ "eval_f1_w": 0.8820343950051113,
223
+ "eval_loss": 0.4112658202648163,
224
+ "eval_precision": 0.8853039418950968,
225
+ "eval_recall": 0.8806597822531658,
226
+ "eval_runtime": 377.6622,
227
+ "eval_samples_per_second": 56.667,
228
+ "eval_steps_per_second": 0.445,
229
+ "step": 5500
230
  }
231
  ],
232
  "logging_steps": 500,
 
246
  "attributes": {}
247
  }
248
  },
249
+ "total_flos": 1.8526799220115046e+17,
250
  "train_batch_size": 32,
251
  "trial_name": null,
252
  "trial_params": null