SpideyDLK commited on
Commit
4c71070
1 Parent(s): ab633b2

Training in progress, step 30800, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b633a636ea01455d95405d2e7b2e68f22243db2a95c2ae32b4cbef581ddbdd59
3
  size 1262135480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f03d9c4dc9c893251efad1bc77811226da4c4437220f84146189aacc8379d6a
3
  size 1262135480
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:769c9a68ca83d6a5f45ce1b0ac12927d2eeea29b91278cdd3d6c171f5494dfc8
3
  size 2490815798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2e73cccc71ac85f330e4ec678e7034ca077c18833bc67911a068fb1452dd155
3
  size 2490815798
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ae6e534def4a67be8922488d0e357ecaf484f188a6c773ca4a58237b636f659
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84e13a4f3a8f7d56afd0f5f975612b4b8f9aa823d2e1d66e0bd153a61bf80520
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8f18eb855b7b39022ee052bd24985576b865c272695e8bedc0f3c7cee91e9b4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ec9c887ded84c0bb967a2d484366bc8237e2095772e8fe2c5537450af655bae
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 20.624151967435548,
5
  "eval_steps": 400,
6
- "global_step": 30400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1223,6 +1223,22 @@
1223
  "eval_steps_per_second": 0.8,
1224
  "eval_wer": 0.03728239100292713,
1225
  "step": 30400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1226
  }
1227
  ],
1228
  "logging_steps": 400,
@@ -1230,7 +1246,7 @@
1230
  "num_input_tokens_seen": 0,
1231
  "num_train_epochs": 21,
1232
  "save_steps": 400,
1233
- "total_flos": 9.273468143459728e+19,
1234
  "train_batch_size": 8,
1235
  "trial_name": null,
1236
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 20.895522388059703,
5
  "eval_steps": 400,
6
+ "global_step": 30800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1223
  "eval_steps_per_second": 0.8,
1224
  "eval_wer": 0.03728239100292713,
1225
  "step": 30400
1226
+ },
1227
+ {
1228
+ "epoch": 20.9,
1229
+ "grad_norm": 0.5151128172874451,
1230
+ "learning_rate": 1.5170420962763511e-06,
1231
+ "loss": 0.0409,
1232
+ "step": 30800
1233
+ },
1234
+ {
1235
+ "epoch": 20.9,
1236
+ "eval_loss": 0.02457941137254238,
1237
+ "eval_runtime": 218.4572,
1238
+ "eval_samples_per_second": 6.404,
1239
+ "eval_steps_per_second": 0.801,
1240
+ "eval_wer": 0.03666615313511015,
1241
+ "step": 30800
1242
  }
1243
  ],
1244
  "logging_steps": 400,
 
1246
  "num_input_tokens_seen": 0,
1247
  "num_train_epochs": 21,
1248
  "save_steps": 400,
1249
+ "total_flos": 9.394928547856309e+19,
1250
  "train_batch_size": 8,
1251
  "trial_name": null,
1252
  "trial_params": null