SpideyDLK commited on
Commit
9898088
1 Parent(s): 8b93c6c

Training in progress, step 29600, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fe283633a388ba2d022ff9f5bd22a4410a9ce61cf5ab36a933f8316c404dc0d
3
  size 1262135480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e63f877c4506681a490774017678ec3ddaf77e75d1e84f86025ada6590efbd8
3
  size 1262135480
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ffc119225525035a7f335e5b8efd08e194472d357b13852524d4f4eb0578b80
3
  size 2490815798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ff96e9d8d8bd2f41f071244c4ff2909a15f3a277d70d0f48e2c1231181b87b5
3
  size 2490815798
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d853691023356ee049c7f9520a152041301e582ba9494903ecaa091cb4963f6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32ab7f10ca6b13468e41de24a05121a51b38477fe4c9a87064b918ea752578ac
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76c2f43626453dc6c68d43c01f88ecb4cc62eda02fd56285615f23696dcf1415
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:940d3836b6775a577a1a3b78f4ff4621e538b7a2a81b57676d7aecf40e93b414
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 19.810040705563093,
5
  "eval_steps": 400,
6
- "global_step": 29200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1175,6 +1175,22 @@
1175
  "eval_steps_per_second": 0.832,
1176
  "eval_wer": 0.04167308581112309,
1177
  "step": 29200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1178
  }
1179
  ],
1180
  "logging_steps": 400,
@@ -1182,7 +1198,7 @@
1182
  "num_input_tokens_seen": 0,
1183
  "num_train_epochs": 30,
1184
  "save_steps": 400,
1185
- "total_flos": 8.903221408478038e+19,
1186
  "train_batch_size": 8,
1187
  "trial_name": null,
1188
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 20.081411126187245,
5
  "eval_steps": 400,
6
+ "global_step": 29600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1175
  "eval_steps_per_second": 0.832,
1176
  "eval_wer": 0.04167308581112309,
1177
  "step": 29200
1178
+ },
1179
+ {
1180
+ "epoch": 20.08,
1181
+ "grad_norm": 7.543890953063965,
1182
+ "learning_rate": 0.00010032021957913997,
1183
+ "loss": 0.0483,
1184
+ "step": 29600
1185
+ },
1186
+ {
1187
+ "epoch": 20.08,
1188
+ "eval_loss": 0.025978881865739822,
1189
+ "eval_runtime": 210.6554,
1190
+ "eval_samples_per_second": 6.641,
1191
+ "eval_steps_per_second": 0.831,
1192
+ "eval_wer": 0.0395932830072408,
1193
+ "step": 29600
1194
  }
1195
  ],
1196
  "logging_steps": 400,
 
1198
  "num_input_tokens_seen": 0,
1199
  "num_train_epochs": 30,
1200
  "save_steps": 400,
1201
+ "total_flos": 9.027987196010655e+19,
1202
  "train_batch_size": 8,
1203
  "trial_name": null,
1204
  "trial_params": null