SystemAdmin123 commited on
Commit
c94f50d
·
verified ·
1 Parent(s): 5d0cebd

Training in progress, step 320, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b02f3bea30ba5f4000f2757ed1fa28858b738010261b54d239d104557caaaf1
3
  size 136062744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7632ba1b08e41a9688dc652015271c5554d97ca9c7a3699508fa42877e5f157f
3
  size 136062744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf4819b116e20e0cf6edb7b9a514d0c38a1681ed9fb664e8b1387fb6e27e99ca
3
  size 272133812
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2a4f822a3e0dfeabb1f9b45e30eea832fd24d20337f8008cdf4a3cc28b90b13
3
  size 272133812
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a021bf8fc1bd19adcc1376dcee299d8a04aa1a7952251bad1e317521748875b7
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85dd38c6cdc192788a99895f3084ff7dbd3299b657e7e5a24e6ed465f9344b6a
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:972bd8028f20fce3573923f9a005027e0d260b48904a7835117b203b223afc00
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d4cb67e36f2b83aebca6d9cfc2016780d42e305cfdcda7c59d7e83846c493f9
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:346eed5082d2ec3cd3b01057d77087e12608217fe1db4e2cc48a1c635d2b350f
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a256cde06a990790428bb39e3cafeb2de78bab76c12cd4e277082638050d6136
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8617efc3472b5b019323214ba6f5ff8db4e44b4f8dae20eed03655cbbbdeade
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f056289e15f55441b8e468a55ec32f1a2b7873d4c0b0e58213f81abf037a634
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b57d29062e2b005ef9338306d164f8255bdbae7cde6979cc3c6601ddda4f3ab8
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8c207fa1f410f5283ce28d883ff8a114b142d07980cca571866b27f63ca8f99
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a7294aa3359669dd9326bd90c9c9925cb82746ef54c24e800e87f0555b79b28
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07d4cbf9fa98068d1cc83eaeae8931895e6a693ef1347a3dcc43ea278a4fd3e5
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:712c430310813615c3ea651f2526c9d2f01c1c820ddb6bf6771a7983456fddf7
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:756c6f30b0c1263bcdec8435dcac3071f9f0d1b0de426bda07a81d2e513ee832
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b34f186dd0d24d76f54563508cd3f031ee1155efb43c5a5a9cfcc9ce2e166bce
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31d40be02311ba43d019df6bdd117f385db008c5f96585c2f8a8e46f02a4a82c
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f71fff5908e20a1b3137a87f6a31d497f79c8c2b801a7eea008ae86f7863417
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13ba300eb50af5f07dfdf5f9c8ec3b31766e55d5d321cd8570f14309b439775d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.2843601895734595,
5
  "eval_steps": 200,
6
- "global_step": 280,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -219,6 +219,34 @@
219
  "learning_rate": 0.00019649409730077935,
220
  "loss": 1.7822,
221
  "step": 280
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
222
  }
223
  ],
224
  "logging_steps": 10,
@@ -238,7 +266,7 @@
238
  "attributes": {}
239
  }
240
  },
241
- "total_flos": 3.810376470757376e+16,
242
  "train_batch_size": 1,
243
  "trial_name": null,
244
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.037914691943128,
5
  "eval_steps": 200,
6
+ "global_step": 320,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
219
  "learning_rate": 0.00019649409730077935,
220
  "loss": 1.7822,
221
  "step": 280
222
+ },
223
+ {
224
+ "epoch": 5.4739336492890995,
225
+ "grad_norm": 6.0,
226
+ "learning_rate": 0.000196145982960926,
227
+ "loss": 1.5687,
228
+ "step": 290
229
+ },
230
+ {
231
+ "epoch": 5.6635071090047395,
232
+ "grad_norm": 1.8359375,
233
+ "learning_rate": 0.00019578173241879872,
234
+ "loss": 1.7941,
235
+ "step": 300
236
+ },
237
+ {
238
+ "epoch": 5.8530805687203795,
239
+ "grad_norm": 1.6875,
240
+ "learning_rate": 0.00019540140680664913,
241
+ "loss": 1.7871,
242
+ "step": 310
243
+ },
244
+ {
245
+ "epoch": 6.037914691943128,
246
+ "grad_norm": 1.4921875,
247
+ "learning_rate": 0.0001950050699546116,
248
+ "loss": 1.7118,
249
+ "step": 320
250
  }
251
  ],
252
  "logging_steps": 10,
 
266
  "attributes": {}
267
  }
268
  },
269
+ "total_flos": 4.353739574791373e+16,
270
  "train_batch_size": 1,
271
  "trial_name": null,
272
  "trial_params": null