k4black commited on
Commit
8f64d91
·
1 Parent(s): f4bf108

Training in progress, step 13500

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bda6d8b01959de39ba727cf65ebf1679bca33d79e28f75e3c9a93b97bde2d98
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c0d147d71a96c906ebb0826962404c68767b66a0beb6d79026300f3e2c851f2
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35737dd63de8dd15a434463f352af1ca13361ec6ad940d8d6d57c02ca720a0c5
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf876759e8b11d059f8734bc8687b6651bb5e3dc1523d1e7b3e7cf51f75bd7ea
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec1d572066a975cce68a6728c4924f1ce1aa043904ec8fb9bf914cc37f8ce9ef
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dca6aa856e22896a84db27110c95826c10ec6824e6ff17f27e272f65e365a925
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f897fc5ea9ff3f8b4c69087123f7b049e20d61b25538299e1d2d1327ed7be47
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1649df062a4967a054ab70170e4b975014ed744f851c13b8199f78139481d1e6
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:752a70445102b249f7f99549c9b0595ef63200e880c377bf3d80c443b9f54831
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cf1cde2626062aa08cd0c52d9866007bfb16a0d69ae902e25110edb2f03d0e2
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.7575966715812683,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
- "epoch": 4.16,
5
- "global_step": 13000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -500,11 +500,30 @@
500
  "eval_samples_per_second": 82.695,
501
  "eval_steps_per_second": 2.605,
502
  "step": 13000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
503
  }
504
  ],
505
  "max_steps": 31250,
506
  "num_train_epochs": 10,
507
- "total_flos": 4.693192667037696e+16,
508
  "trial_name": null,
509
  "trial_params": null
510
  }
 
1
  {
2
  "best_metric": 0.7575966715812683,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-12000",
4
+ "epoch": 4.32,
5
+ "global_step": 13500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
500
  "eval_samples_per_second": 82.695,
501
  "eval_steps_per_second": 2.605,
502
  "step": 13000
503
+ },
504
+ {
505
+ "epoch": 4.32,
506
+ "learning_rate": 5.981069154848924e-05,
507
+ "loss": 0.443,
508
+ "step": 13500
509
+ },
510
+ {
511
+ "epoch": 4.32,
512
+ "eval_bleu": 0.13844237313177618,
513
+ "eval_exact_match": 0.163,
514
+ "eval_loss": 0.7602689266204834,
515
+ "eval_rouge1": 0.5739436350821147,
516
+ "eval_rouge2": 0.4082942402749472,
517
+ "eval_rougeL": 0.5570060194504324,
518
+ "eval_runtime": 21.9206,
519
+ "eval_samples_per_second": 91.238,
520
+ "eval_steps_per_second": 2.874,
521
+ "step": 13500
522
  }
523
  ],
524
  "max_steps": 31250,
525
  "num_train_epochs": 10,
526
+ "total_flos": 4.874625964887245e+16,
527
  "trial_name": null,
528
  "trial_params": null
529
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35737dd63de8dd15a434463f352af1ca13361ec6ad940d8d6d57c02ca720a0c5
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf876759e8b11d059f8734bc8687b6651bb5e3dc1523d1e7b3e7cf51f75bd7ea
3
  size 242019067