Training in progress, step 800

Browse files

Files changed (10) hide show

{checkpoint-500 → checkpoint-800}/config.json +0 -0
{checkpoint-500 → checkpoint-800}/optimizer.pt +1 -1
{checkpoint-500 → checkpoint-800}/preprocessor_config.json +0 -0
{checkpoint-500 → checkpoint-800}/pytorch_model.bin +1 -1
{checkpoint-500 → checkpoint-800}/rng_state.pth +1 -1
{checkpoint-500 → checkpoint-800}/scaler.pt +1 -1
{checkpoint-500 → checkpoint-800}/scheduler.pt +1 -1
{checkpoint-500 → checkpoint-800}/trainer_state.json +120 -3
{checkpoint-500 → checkpoint-800}/training_args.bin +0 -0
pytorch_model.bin +1 -1

{checkpoint-500 → checkpoint-800}/config.json RENAMED Viewed

File without changes

{checkpoint-500 → checkpoint-800}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f4f451d7dca685dc733896a3b9dde8e1707a70872842fb140a7b1b2bc09dc86e
 size 2490337809

 version https://git-lfs.github.com/spec/v1
+oid sha256:d3228c2d654fd3d25a0ad00a301f5ce6f4265d0cc4c922a869f44a37a2b0f0f2
 size 2490337809

{checkpoint-500 → checkpoint-800}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-500 → checkpoint-800}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee400442c70fe28b4032830f08f4c31605f74d5b5778895b5f30b7cad432bdcd
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:83f2151485570eebb9c2c7ead79b5dbb947c911745136ec08aec4531150fc59d
 size 1262063089

{checkpoint-500 → checkpoint-800}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:60bd99fb8f131eb1ec63d9b9eee304bd3aa49c3b43a3a12613b8de4c1d42c4c6
 size 14567

 version https://git-lfs.github.com/spec/v1
+oid sha256:191ab0b0b7f850bd200dd0e9733735c31b1e7d63b3150165c4de6c4a12c5ef5e
 size 14567

{checkpoint-500 → checkpoint-800}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4fa4c7be44c959599b8b43bb9bc3371e9e4e5bbc5758b3ab5afcccfda3e72e67
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c2074cdcefbaa0a39f736d6b0f7bf018c350d49e85648bc8accc4f756ad816e
 size 559

{checkpoint-500 → checkpoint-800}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:536ace7f76d669d6713c8de85eb8de0ed71bdc66a4ba89707e46295a79ac66a8
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:595ce5051ecea72321f0a4e15d7e1d59293398355f90dbde31fcccb29f2b4f95
 size 623

{checkpoint-500 → checkpoint-800}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 5.491803278688525,
-  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -201,11 +201,128 @@
       "eval_steps_per_second": 0.796,
       "eval_wer": 1.0,
       "step": 500
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
-  "total_flos": 7.741689365780442e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 8.78688524590164,
+  "global_step": 800,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.796,
       "eval_wer": 1.0,
       "step": 500
+    },
+    {
+      "epoch": 5.71,
+      "learning_rate": 6.500000000000001e-05,
+      "loss": 3.0088,
+      "step": 520
+    },
+    {
+      "epoch": 5.93,
+      "learning_rate": 6.75e-05,
+      "loss": 3.0051,
+      "step": 540
+    },
+    {
+      "epoch": 6.15,
+      "learning_rate": 7.000000000000001e-05,
+      "loss": 3.073,
+      "step": 560
+    },
+    {
+      "epoch": 6.37,
+      "learning_rate": 7.25e-05,
+      "loss": 3.0031,
+      "step": 580
+    },
+    {
+      "epoch": 6.59,
+      "learning_rate": 7.5e-05,
+      "loss": 2.9964,
+      "step": 600
+    },
+    {
+      "epoch": 6.59,
+      "eval_loss": 2.998962640762329,
+      "eval_runtime": 193.5213,
+      "eval_samples_per_second": 25.026,
+      "eval_steps_per_second": 0.785,
+      "eval_wer": 1.0,
+      "step": 600
+    },
+    {
+      "epoch": 6.81,
+      "learning_rate": 7.75e-05,
+      "loss": 2.9921,
+      "step": 620
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 8e-05,
+      "loss": 3.0665,
+      "step": 640
+    },
+    {
+      "epoch": 7.25,
+      "learning_rate": 8.25e-05,
+      "loss": 2.9826,
+      "step": 660
+    },
+    {
+      "epoch": 7.47,
+      "learning_rate": 8.5e-05,
+      "loss": 2.9689,
+      "step": 680
+    },
+    {
+      "epoch": 7.69,
+      "learning_rate": 8.75e-05,
+      "loss": 2.9602,
+      "step": 700
+    },
+    {
+      "epoch": 7.69,
+      "eval_loss": 2.9620397090911865,
+      "eval_runtime": 193.5851,
+      "eval_samples_per_second": 25.017,
+      "eval_steps_per_second": 0.785,
+      "eval_wer": 1.0,
+      "step": 700
+    },
+    {
+      "epoch": 7.91,
+      "learning_rate": 8.999999999999999e-05,
+      "loss": 2.9639,
+      "step": 720
+    },
+    {
+      "epoch": 8.13,
+      "learning_rate": 9.25e-05,
+      "loss": 3.0215,
+      "step": 740
+    },
+    {
+      "epoch": 8.35,
+      "learning_rate": 9.5e-05,
+      "loss": 2.9454,
+      "step": 760
+    },
+    {
+      "epoch": 8.57,
+      "learning_rate": 9.750000000000001e-05,
+      "loss": 2.9239,
+      "step": 780
+    },
+    {
+      "epoch": 8.79,
+      "learning_rate": 0.0001,
+      "loss": 2.8756,
+      "step": 800
+    },
+    {
+      "epoch": 8.79,
+      "eval_loss": 2.7302000522613525,
+      "eval_runtime": 191.8065,
+      "eval_samples_per_second": 25.249,
+      "eval_steps_per_second": 0.792,
+      "eval_wer": 1.0,
+      "step": 800
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
+  "total_flos": 1.2402928809554872e+19,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-500 → checkpoint-800}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:866e0246bd78706b1bfb6c07818d34662e459927e54718460f8a950f5fc33ae8
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:83f2151485570eebb9c2c7ead79b5dbb947c911745136ec08aec4531150fc59d
 size 1262063089