SpideyDLK commited on
Commit
b01b34b
1 Parent(s): 9c10562

Training in progress, step 22800, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:650fbf8d3ad6a937ad00b726e0e059fa5b0d4095b358ccb8b83b99d705d67f3a
3
  size 1262135480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a16074066d83775c4a17f83bfe52f28073ece39419bc4a2c1994d1e78611cd1
3
  size 1262135480
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b39a22fbed5001e0bf23ebb6e438a705bc06cdb375ddfc0ba39c29784850d050
3
  size 2490815798
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffdaa7ea99a7342739b3bc43c0b8e16b6c966f5fe52975037fac0a052ca78060
3
  size 2490815798
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09310d30ce2f1f65bdee86a47be5289ce008cf20400e5805ad00f3f50b144fbe
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c63df3feb106877a0c8b87b26e82b03b96040a2cc3e6b78b40ee9491bfeb2aba
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f68ad3f7fcdd16a1878b08fa3b7e4a910f778b64d8df6baad5daa110cbd65670
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:639e352d17a1224a5c4830a5109fe70a62931a8070aa98536eb532b2f173108d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 15.19674355495251,
5
  "eval_steps": 400,
6
- "global_step": 22400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -903,6 +903,22 @@
903
  "eval_steps_per_second": 0.83,
904
  "eval_wer": 0.05592358650439069,
905
  "step": 22400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
906
  }
907
  ],
908
  "logging_steps": 400,
@@ -910,7 +926,7 @@
910
  "num_input_tokens_seen": 0,
911
  "num_train_epochs": 30,
912
  "save_steps": 400,
913
- "total_flos": 6.831976523110607e+19,
914
  "train_batch_size": 8,
915
  "trial_name": null,
916
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.468113975576662,
5
  "eval_steps": 400,
6
+ "global_step": 22800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
903
  "eval_steps_per_second": 0.83,
904
  "eval_wer": 0.05592358650439069,
905
  "step": 22400
906
+ },
907
+ {
908
+ "epoch": 15.47,
909
+ "grad_norm": 0.4220418632030487,
910
+ "learning_rate": 0.00014698078682525158,
911
+ "loss": 0.0672,
912
+ "step": 22800
913
+ },
914
+ {
915
+ "epoch": 15.47,
916
+ "eval_loss": 0.030694805085659027,
917
+ "eval_runtime": 208.4031,
918
+ "eval_samples_per_second": 6.713,
919
+ "eval_steps_per_second": 0.84,
920
+ "eval_wer": 0.05345863503312279,
921
+ "step": 22800
922
  }
923
  ],
924
  "logging_steps": 400,
 
926
  "num_input_tokens_seen": 0,
927
  "num_train_epochs": 30,
928
  "save_steps": 400,
929
+ "total_flos": 6.954458728485663e+19,
930
  "train_batch_size": 8,
931
  "trial_name": null,
932
  "trial_params": null