bobox committed on
Commit
c80f3ed
·
verified ·
1 Parent(s): 3f21601

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -563,6 +563,10 @@ You can finetune this model on your own dataset.
563
  | 3.4871 | 1624 | 1.9654 | 0.2392 | 1.5037 |
564
  | 3.7371 | 1740 | 2.1107 | 0.2234 | 1.4557 |
565
  | 3.9871 | 1856 | 2.0709 | 0.2094 | 1.4287 |
 
 
 
 
566
 
567
 
568
  ### Framework Versions
 
563
  | 3.4871 | 1624 | 1.9654 | 0.2392 | 1.5037 |
564
  | 3.7371 | 1740 | 2.1107 | 0.2234 | 1.4557 |
565
  | 3.9871 | 1856 | 2.0709 | 0.2094 | 1.4287 |
566
+ | 4.2328 | 1972 | 1.9489 | 0.2072 | 1.4167 |
567
+ | 4.4828 | 2088 | 1.8238 | 0.2019 | 1.4155 |
568
+ | 4.7328 | 2204 | 2.1587 | 0.2005 | 1.4136 |
569
+ | 4.9828 | 2320 | 1.929 | 0.2005 | 1.4132 |
570
 
571
 
572
  ### Framework Versions
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45eeac36057b0a84a3d410d1974ea4ef60e1f6732308a7c19c7fd4aa6ff3adf0
3
  size 1130520122
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2415efd86ddb31b8ccd116ba8fb00cf3a2bb32e6d5d2ef1d307b59571c494cb5
3
  size 1130520122
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5df76c36ed895286d93c7e35de2022f1a4142ca300d68137813a64ef7c2467b2
3
  size 565251810
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa6de6db3864cbe5490abac662a29ae3c7a4c0dce0a1063f4172a3ba474b3b0e
3
  size 565251810
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23ac986d8316aed04b3cf90a12a44166385897956e05972f0500d5a12c28b4e2
3
  size 14180
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee7def8d6e19abe0010fc23ee8ceef6f2e3224be5f40cd1c4f4ae996d6eab300
3
  size 14180
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c4113c75337369f487518d15e4b953b9a64a66968b355fbea0722908652f445
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d07db50179fc1817acd2aeda9c1e69355a330f49f4a4908ab69b93d19e89e01
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.004310344827586,
5
  "eval_steps": 116,
6
- "global_step": 1864,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -375,6 +375,98 @@
375
  "eval_qnli-contrastive_samples_per_second": 1383.695,
376
  "eval_qnli-contrastive_steps_per_second": 86.481,
377
  "step": 1856
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
378
  }
379
  ],
380
  "logging_steps": 116,
@@ -389,7 +481,7 @@
389
  "should_evaluate": false,
390
  "should_log": false,
391
  "should_save": true,
392
- "should_training_stop": false
393
  },
394
  "attributes": {}
395
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.982758620689655,
5
  "eval_steps": 116,
6
+ "global_step": 2320,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
375
  "eval_qnli-contrastive_samples_per_second": 1383.695,
376
  "eval_qnli-contrastive_steps_per_second": 86.481,
377
  "step": 1856
378
+ },
379
+ {
380
+ "epoch": 4.232758620689655,
381
+ "grad_norm": 4.497424602508545,
382
+ "learning_rate": 3.680019472369961e-07,
383
+ "loss": 1.9489,
384
+ "step": 1972
385
+ },
386
+ {
387
+ "epoch": 4.232758620689655,
388
+ "eval_nli-pairs_loss": 1.4166995286941528,
389
+ "eval_nli-pairs_runtime": 1.3578,
390
+ "eval_nli-pairs_samples_per_second": 1472.956,
391
+ "eval_nli-pairs_steps_per_second": 92.06,
392
+ "step": 1972
393
+ },
394
+ {
395
+ "epoch": 4.232758620689655,
396
+ "eval_qnli-contrastive_loss": 0.2071654498577118,
397
+ "eval_qnli-contrastive_runtime": 1.489,
398
+ "eval_qnli-contrastive_samples_per_second": 1343.182,
399
+ "eval_qnli-contrastive_steps_per_second": 83.949,
400
+ "step": 1972
401
+ },
402
+ {
403
+ "epoch": 4.482758620689655,
404
+ "grad_norm": 8.940858840942383,
405
+ "learning_rate": 1.7030146916085187e-07,
406
+ "loss": 1.8238,
407
+ "step": 2088
408
+ },
409
+ {
410
+ "epoch": 4.482758620689655,
411
+ "eval_nli-pairs_loss": 1.4154555797576904,
412
+ "eval_nli-pairs_runtime": 1.4109,
413
+ "eval_nli-pairs_samples_per_second": 1417.564,
414
+ "eval_nli-pairs_steps_per_second": 88.598,
415
+ "step": 2088
416
+ },
417
+ {
418
+ "epoch": 4.482758620689655,
419
+ "eval_qnli-contrastive_loss": 0.20185217261314392,
420
+ "eval_qnli-contrastive_runtime": 1.4817,
421
+ "eval_qnli-contrastive_samples_per_second": 1349.799,
422
+ "eval_qnli-contrastive_steps_per_second": 84.362,
423
+ "step": 2088
424
+ },
425
+ {
426
+ "epoch": 4.732758620689655,
427
+ "grad_norm": 4.952300548553467,
428
+ "learning_rate": 4.5391654754460885e-08,
429
+ "loss": 2.1587,
430
+ "step": 2204
431
+ },
432
+ {
433
+ "epoch": 4.732758620689655,
434
+ "eval_nli-pairs_loss": 1.4136021137237549,
435
+ "eval_nli-pairs_runtime": 1.3576,
436
+ "eval_nli-pairs_samples_per_second": 1473.214,
437
+ "eval_nli-pairs_steps_per_second": 92.076,
438
+ "step": 2204
439
+ },
440
+ {
441
+ "epoch": 4.732758620689655,
442
+ "eval_qnli-contrastive_loss": 0.20051518082618713,
443
+ "eval_qnli-contrastive_runtime": 1.585,
444
+ "eval_qnli-contrastive_samples_per_second": 1261.81,
445
+ "eval_qnli-contrastive_steps_per_second": 78.863,
446
+ "step": 2204
447
+ },
448
+ {
449
+ "epoch": 4.982758620689655,
450
+ "grad_norm": 10.16062068939209,
451
+ "learning_rate": 1.1034588846758897e-10,
452
+ "loss": 1.929,
453
+ "step": 2320
454
+ },
455
+ {
456
+ "epoch": 4.982758620689655,
457
+ "eval_nli-pairs_loss": 1.4131741523742676,
458
+ "eval_nli-pairs_runtime": 1.2998,
459
+ "eval_nli-pairs_samples_per_second": 1538.653,
460
+ "eval_nli-pairs_steps_per_second": 96.166,
461
+ "step": 2320
462
+ },
463
+ {
464
+ "epoch": 4.982758620689655,
465
+ "eval_qnli-contrastive_loss": 0.2004699856042862,
466
+ "eval_qnli-contrastive_runtime": 1.449,
467
+ "eval_qnli-contrastive_samples_per_second": 1380.303,
468
+ "eval_qnli-contrastive_steps_per_second": 86.269,
469
+ "step": 2320
470
  }
471
  ],
472
  "logging_steps": 116,
 
481
  "should_evaluate": false,
482
  "should_log": false,
483
  "should_save": true,
484
+ "should_training_stop": true
485
  },
486
  "attributes": {}
487
  }