ngwgsang commited on
Commit
0174f50
·
verified ·
1 Parent(s): 8100c96

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6abbe53ad4bdac2acb6b66d420455cd29cb6827b7c717226acf69fa003615a2
3
  size 526442440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d31a90689bda13906c3d2b9014cf0f03ffe475ca00bd46cc5a89ef704c269aa2
3
  size 526442440
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb66437cd1a1f3e85d760dae4101799dad85f6d2f44db58e8d2447de6ae42cdf
3
  size 1052723962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba95173fda6e5cd98497f7c742e0d43e56efc23513b8f1b8c8542a823a06881f
3
  size 1052723962
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90e807d11977312b0373d61c5dd72b09e491f95b6790237c43c227444a908b23
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b4628423d479157682a147c925ad8913f28124292218dbe5f25553313c28d24
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79a65e50ebd7c88e6afe05bce60e1437447659f0ab3d763f77217140057a93ad
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7eaa191070e51793fbf344cd35501716ecc7578f20c1ced375c0d7bb5bee549
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.37554213404655457,
3
  "best_model_checkpoint": "./vit5_qqp/checkpoint-863",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 863,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -22,6 +22,28 @@
22
  "eval_samples_per_second": 536.767,
23
  "eval_steps_per_second": 13.443,
24
  "step": 863
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
  "logging_steps": 500,
@@ -41,7 +63,7 @@
41
  "attributes": {}
42
  }
43
  },
44
- "total_flos": 821883496366080.0,
45
  "train_batch_size": 40,
46
  "trial_name": null,
47
  "trial_params": null
 
1
  {
2
  "best_metric": 0.37554213404655457,
3
  "best_model_checkpoint": "./vit5_qqp/checkpoint-863",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 1726,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
22
  "eval_samples_per_second": 536.767,
23
  "eval_steps_per_second": 13.443,
24
  "step": 863
25
+ },
26
+ {
27
+ "epoch": 1.1587485515643106,
28
+ "grad_norm": 1.1074819564819336,
29
+ "learning_rate": 3.0687524140594824e-05,
30
+ "loss": 0.2304,
31
+ "step": 1000
32
+ },
33
+ {
34
+ "epoch": 1.7381228273464657,
35
+ "grad_norm": 1.0999990701675415,
36
+ "learning_rate": 2.103128621089224e-05,
37
+ "loss": 0.1765,
38
+ "step": 1500
39
+ },
40
+ {
41
+ "epoch": 2.0,
42
+ "eval_loss": 0.3892330229282379,
43
+ "eval_runtime": 40.1411,
44
+ "eval_samples_per_second": 537.155,
45
+ "eval_steps_per_second": 13.453,
46
+ "step": 1726
47
  }
48
  ],
49
  "logging_steps": 500,
 
63
  "attributes": {}
64
  }
65
  },
66
+ "total_flos": 1643766992732160.0,
67
  "train_batch_size": 40,
68
  "trial_name": null,
69
  "trial_params": null