Training in progress, step 20000

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +72 -3
pytorch_model.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ab515e1fe640432722359a2c1b73c30cb1877b811da7dd7eb4d12a0264d38ca7
 size 1668076741

 version https://git-lfs.github.com/spec/v1
+oid sha256:291f9655e8deedacd6ba5d051af226c4cb8ebd7310cc9e38474e2a0f61b6d10e
 size 1668076741

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a6b694759ac2afff917fcdce63156bddf5fee0be806cea69404c4a6ae5f6230
 size 834053717

 version https://git-lfs.github.com/spec/v1
+oid sha256:abbe85aaf27562d1d64f10fe9cebefd891fb599fac4d07e142f8b427c63c674d
 size 834053717

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1a4769972fb7cd6e12627b484967936feb779148fd2d15221e6fc67a874d999b
 size 15597

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f5b5027ca54bd16ebf7bcd1124e301f3adcb854fc2dbe6bf992e7e1ea1ae077
 size 15597

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0909b42e35569611bafb37fd33209cd6a86113e40deac3fa1da41689cd651093
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:0876994cba4fff49c925c2a122534ea9fff9a44c01c8ac7813ec4131482c3100
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6bf931b79849e3c5ce67ad727efd02c50905b3121a21823c140a392dee34ce6e
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:32d54ab2a4c0dda7883ab94b84e46d25097c34cdf01933d23db795cca974f4ce
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.2,
-  "global_step": 10000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -75,11 +75,80 @@
       "eval_samples_per_second": 41.069,
       "eval_steps_per_second": 2.571,
       "step": 10000
     }
   ],
   "max_steps": 50000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 6.7342134411264e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.4,
+  "global_step": 20000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 41.069,
       "eval_steps_per_second": 2.571,
       "step": 10000
+    },
+    {
+      "epoch": 0.22,
+      "learning_rate": 2.7697770521953444e-05,
+      "loss": 0.8444,
+      "step": 11000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 2.714224866611362e-05,
+      "loss": 0.7575,
+      "step": 12000
+    },
+    {
+      "epoch": 0.26,
+      "learning_rate": 2.6533631846300875e-05,
+      "loss": 0.7919,
+      "step": 13000
+    },
+    {
+      "epoch": 0.28,
+      "learning_rate": 2.587458138901327e-05,
+      "loss": 0.833,
+      "step": 14000
+    },
+    {
+      "epoch": 0.3,
+      "learning_rate": 2.516797915421335e-05,
+      "loss": 0.8335,
+      "step": 15000
+    },
+    {
+      "epoch": 0.32,
+      "learning_rate": 2.4416914933687753e-05,
+      "loss": 0.8382,
+      "step": 16000
+    },
+    {
+      "epoch": 0.34,
+      "learning_rate": 2.3624672940173894e-05,
+      "loss": 0.8253,
+      "step": 17000
+    },
+    {
+      "epoch": 0.36,
+      "learning_rate": 2.27947174463333e-05,
+      "loss": 0.8442,
+      "step": 18000
+    },
+    {
+      "epoch": 0.38,
+      "learning_rate": 2.193067763636869e-05,
+      "loss": 0.8794,
+      "step": 19000
+    },
+    {
+      "epoch": 0.4,
+      "learning_rate": 2.1036331736524874e-05,
+      "loss": 0.8631,
+      "step": 20000
+    },
+    {
+      "epoch": 0.4,
+      "eval_accuracy": 0.855058580917128,
+      "eval_loss": 0.6343714594841003,
+      "eval_runtime": 151.1949,
+      "eval_samples_per_second": 33.07,
+      "eval_steps_per_second": 2.07,
+      "step": 20000
     }
   ],
   "max_steps": 50000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.34684268822528e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a6b694759ac2afff917fcdce63156bddf5fee0be806cea69404c4a6ae5f6230
 size 834053717

 version https://git-lfs.github.com/spec/v1
+oid sha256:abbe85aaf27562d1d64f10fe9cebefd891fb599fac4d07e142f8b427c63c674d
 size 834053717