SpideyDLK committed on
Commit
5447491
1 Parent(s): 9ed6451

Training in progress, step 29200, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2685df91b0212c3d771f740af7d493329819e9ece934c6572ec91f4ac11a64ea
3
  size 1262135480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fe283633a388ba2d022ff9f5bd22a4410a9ce61cf5ab36a933f8316c404dc0d
3
  size 1262135480
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f33961fae286f63a4d7d03dcc99f6908f11c6a773bd2e93e0e7d4d192962b30a
3
  size 2490815798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ffc119225525035a7f335e5b8efd08e194472d357b13852524d4f4eb0578b80
3
  size 2490815798
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd07cca9b4e51cb881f8cba86aaed9cb56420ad7f452f9d07931ab907d7921d1
3
- size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d853691023356ee049c7f9520a152041301e582ba9494903ecaa091cb4963f6
3
+ size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb762c3231bb27770a54b360094bd1e9cd8e02cdf5dec63794e81b5cd90258bf
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76c2f43626453dc6c68d43c01f88ecb4cc62eda02fd56285615f23696dcf1415
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 19.53867028493894,
5
  "eval_steps": 400,
6
- "global_step": 28800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1159,6 +1159,22 @@
1159
  "eval_steps_per_second": 0.833,
1160
  "eval_wer": 0.04190417501155446,
1161
  "step": 28800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1162
  }
1163
  ],
1164
  "logging_steps": 400,
@@ -1166,7 +1182,7 @@
1166
  "num_input_tokens_seen": 0,
1167
  "num_train_epochs": 30,
1168
  "save_steps": 400,
1169
- "total_flos": 8.781106063335208e+19,
1170
  "train_batch_size": 8,
1171
  "trial_name": null,
1172
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 19.810040705563093,
5
  "eval_steps": 400,
6
+ "global_step": 29200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1159
  "eval_steps_per_second": 0.833,
1160
  "eval_wer": 0.04190417501155446,
1161
  "step": 28800
1162
+ },
1163
+ {
1164
+ "epoch": 19.81,
1165
+ "grad_norm": 0.6549252271652222,
1166
+ "learning_rate": 0.00010306495882891125,
1167
+ "loss": 0.0454,
1168
+ "step": 29200
1169
+ },
1170
+ {
1171
+ "epoch": 19.81,
1172
+ "eval_loss": 0.027856331318616867,
1173
+ "eval_runtime": 210.3168,
1174
+ "eval_samples_per_second": 6.652,
1175
+ "eval_steps_per_second": 0.832,
1176
+ "eval_wer": 0.04167308581112309,
1177
+ "step": 29200
1178
  }
1179
  ],
1180
  "logging_steps": 400,
 
1182
  "num_input_tokens_seen": 0,
1183
  "num_train_epochs": 30,
1184
  "save_steps": 400,
1185
+ "total_flos": 8.903221408478038e+19,
1186
  "train_batch_size": 8,
1187
  "trial_name": null,
1188
  "trial_params": null