Training in progress, step 850000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Feb09_18-20-41_t1v-n-0cfb531e-w-0/events.out.tfevents.1675967137.t1v-n-0cfb531e-w-0.3767571.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0736aff937bc5cbe089a02ee96acafe29a3ce8b5ef41405f8f101efedc8d1867
 size 1475917081

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd4783c79d837195c8c28a24f0933d1e492e2e7dcaa298df4fb471ffea73d2a9
 size 1475917081

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a83020031862aea2e988f120ee4fbfdb9e36868ffeeee41e4196243bad5ad70f
 size 737971755

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a530a13febf37ee76db07823fcaf2dde21e0920e1af9b68cf155f551129662b
 size 737971755

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea5f4d07228ced52baeea808cd24096aeb8c1e411df6d964bc2778cd1f37bff3
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c21fdf578f3ba8c419f0f122cdc5b04fd848666ce4f24ed13deaeeda0b66dba
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50e51b9224ded3ddffee57f26ec45414409de0232579ddafb7f3e083076fa4c5
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:adedebe0cc7e07de957a9e2967d6e9c3934a9fdca3245f46a29d125e5e36192e
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8,
-  "global_step": 800000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4934,11 +4934,319 @@
       "eval_samples_per_second": 241.45,
       "eval_steps_per_second": 1.932,
       "step": 800000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.34914183790592e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.85,
+  "global_step": 850000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 241.45,
       "eval_steps_per_second": 1.932,
       "step": 800000
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 1.0441632244932237e-05,
+      "loss": 0.7146,
+      "step": 801000
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 1.0340722563656107e-05,
+      "loss": 0.746,
+      "step": 802000
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 1.0240246589884044e-05,
+      "loss": 0.7146,
+      "step": 803000
+    },
+    {
+      "epoch": 0.8,
+      "learning_rate": 1.0140205422405214e-05,
+      "loss": 0.7564,
+      "step": 804000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 1.0040600155253765e-05,
+      "loss": 0.761,
+      "step": 805000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.941431877696955e-06,
+      "loss": 0.7907,
+      "step": 806000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.842701674223187e-06,
+      "loss": 0.7909,
+      "step": 807000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.744410624530148e-06,
+      "loss": 0.7931,
+      "step": 808000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.646559803512994e-06,
+      "loss": 0.7779,
+      "step": 809000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.549150281252633e-06,
+      "loss": 0.7252,
+      "step": 810000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.452183123004e-06,
+      "loss": 0.7497,
+      "step": 811000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.355659389184396e-06,
+      "loss": 0.7757,
+      "step": 812000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.259580135361929e-06,
+      "loss": 0.726,
+      "step": 813000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.163946412243896e-06,
+      "loss": 0.7048,
+      "step": 814000
+    },
+    {
+      "epoch": 0.81,
+      "learning_rate": 9.068759265665384e-06,
+      "loss": 0.681,
+      "step": 815000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.974019736577777e-06,
+      "loss": 0.7358,
+      "step": 816000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.879728861037384e-06,
+      "loss": 0.7676,
+      "step": 817000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.785887670194138e-06,
+      "loss": 0.7497,
+      "step": 818000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.692497190280224e-06,
+      "loss": 0.7809,
+      "step": 819000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.599558442598998e-06,
+      "loss": 0.8028,
+      "step": 820000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.507072443513702e-06,
+      "loss": 0.8323,
+      "step": 821000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.415040204436426e-06,
+      "loss": 0.8181,
+      "step": 822000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.323462731816961e-06,
+      "loss": 0.8814,
+      "step": 823000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.232341027131885e-06,
+      "loss": 0.829,
+      "step": 824000
+    },
+    {
+      "epoch": 0.82,
+      "learning_rate": 8.141676086873572e-06,
+      "loss": 0.7633,
+      "step": 825000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 8.051468902539272e-06,
+      "loss": 0.7566,
+      "step": 826000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.96172046062032e-06,
+      "loss": 0.7469,
+      "step": 827000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.872431742591268e-06,
+      "loss": 0.6765,
+      "step": 828000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.783603724899257e-06,
+      "loss": 0.7272,
+      "step": 829000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.695237378953223e-06,
+      "loss": 0.7554,
+      "step": 830000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.607333671113409e-06,
+      "loss": 0.7978,
+      "step": 831000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.519893562680663e-06,
+      "loss": 0.8094,
+      "step": 832000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.432918009885997e-06,
+      "loss": 0.786,
+      "step": 833000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.3464079638801365e-06,
+      "loss": 0.8359,
+      "step": 834000
+    },
+    {
+      "epoch": 0.83,
+      "learning_rate": 7.260364370723044e-06,
+      "loss": 0.862,
+      "step": 835000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 7.174788171373731e-06,
+      "loss": 0.8762,
+      "step": 836000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 7.089680301679752e-06,
+      "loss": 0.8808,
+      "step": 837000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 7.005041692367154e-06,
+      "loss": 0.8604,
+      "step": 838000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.92087326903022e-06,
+      "loss": 0.7643,
+      "step": 839000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.837175952121306e-06,
+      "loss": 0.7278,
+      "step": 840000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.753950656940905e-06,
+      "loss": 0.7171,
+      "step": 841000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.671198293627479e-06,
+      "loss": 0.6912,
+      "step": 842000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.588919767147639e-06,
+      "loss": 0.5905,
+      "step": 843000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.5071159772861436e-06,
+      "loss": 0.632,
+      "step": 844000
+    },
+    {
+      "epoch": 0.84,
+      "learning_rate": 6.425787818636131e-06,
+      "loss": 0.7451,
+      "step": 845000
+    },
+    {
+      "epoch": 0.85,
+      "learning_rate": 6.344936180589351e-06,
+      "loss": 0.7537,
+      "step": 846000
+    },
+    {
+      "epoch": 0.85,
+      "learning_rate": 6.264561947326331e-06,
+      "loss": 0.66,
+      "step": 847000
+    },
+    {
+      "epoch": 0.85,
+      "learning_rate": 6.184665997806832e-06,
+      "loss": 0.7213,
+      "step": 848000
+    },
+    {
+      "epoch": 0.85,
+      "learning_rate": 6.1052492057601275e-06,
+      "loss": 0.7708,
+      "step": 849000
+    },
+    {
+      "epoch": 0.85,
+      "learning_rate": 6.026312439675552e-06,
+      "loss": 0.8174,
+      "step": 850000
+    },
+    {
+      "epoch": 0.85,
+      "eval_loss": 0.5826455354690552,
+      "eval_runtime": 13.0928,
+      "eval_samples_per_second": 381.888,
+      "eval_steps_per_second": 3.055,
+      "step": 850000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.43346320277504e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a83020031862aea2e988f120ee4fbfdb9e36868ffeeee41e4196243bad5ad70f
 size 737971755

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a530a13febf37ee76db07823fcaf2dde21e0920e1af9b68cf155f551129662b
 size 737971755

runs/Feb09_18-20-41_t1v-n-0cfb531e-w-0/events.out.tfevents.1675967137.t1v-n-0cfb531e-w-0.3767571.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a89903c3ad93724a201222cc39ca9ad19e4291497e25d97bb164b6fca4688679
-size 12096

 version https://git-lfs.github.com/spec/v1
+oid sha256:bfabe543bd4f71179f1898ab0b35a69b1e7be998b3da381bc1404de8dd44afcf
+size 20372