Training in progress, step 200000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Feb16_16-14-57_t1v-n-eeadb94b-w-0/events.out.tfevents.1676564607.t1v-n-eeadb94b-w-0.3898595.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e2eb45535e100aeb2e53731922f2dfe2348f199f7f9c5f250e255442e6e5514c
 size 2693742553

 version https://git-lfs.github.com/spec/v1
+oid sha256:8da94f9b90f1ba4c0d3164e62b77b676f2b235652f6f692114e1b2bdb5273523
 size 2693742553

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6caf4b5ebffdcb04f4fec8820e2a50cd7e7dada8bbf5818d249024f9b029b50f
 size 1346893675

 version https://git-lfs.github.com/spec/v1
+oid sha256:de8a4f7df26972b1c1fe1546343f51ae325d6a1916a83baac53a80c81d4dd4ce
 size 1346893675

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63ae91a2fec6011908bf6cd9856e3a511813695d55eb3a0fc1be3c461ba6b8e1
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:c5a9eaaa7cc088403f9a31ab70b2e1791d125e5bf39dbc05085cce4adba73595
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04ad030a150fa0d8eb5e5920300951e9645dc85319159f9dd4f177aff4c5b722
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:be1ccf49f4804619cd7d22b74b595a694a368e629a10492b4089d6536d07bdf2
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.15,
-  "global_step": 150000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -930,11 +930,319 @@
       "eval_samples_per_second": 219.028,
       "eval_steps_per_second": 3.461,
       "step": 150000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 8.9474847473664e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2,
+  "global_step": 200000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 219.028,
       "eval_steps_per_second": 3.461,
       "step": 150000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.723691552302562e-05,
+      "loss": 0.7738,
+      "step": 151000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.718245238567939e-05,
+      "loss": 0.7963,
+      "step": 152000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.712747326859315e-05,
+      "loss": 0.8171,
+      "step": 153000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.707197877300974e-05,
+      "loss": 0.8773,
+      "step": 154000
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 9.701596950580806e-05,
+      "loss": 0.9735,
+      "step": 155000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.695944607949649e-05,
+      "loss": 0.8433,
+      "step": 156000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.690240911220618e-05,
+      "loss": 0.8706,
+      "step": 157000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.684485922768422e-05,
+      "loss": 0.7855,
+      "step": 158000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.6786797055287e-05,
+      "loss": 0.785,
+      "step": 159000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.672822322997305e-05,
+      "loss": 0.765,
+      "step": 160000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.66691383922964e-05,
+      "loss": 0.7384,
+      "step": 161000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.660954318839933e-05,
+      "loss": 0.7583,
+      "step": 162000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.654943827000548e-05,
+      "loss": 0.7785,
+      "step": 163000
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 9.648882429441257e-05,
+      "loss": 0.8002,
+      "step": 164000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.642770192448536e-05,
+      "loss": 0.8721,
+      "step": 165000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.636607182864827e-05,
+      "loss": 0.9439,
+      "step": 166000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.630393468087818e-05,
+      "loss": 0.8458,
+      "step": 167000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.624129116069694e-05,
+      "loss": 0.8241,
+      "step": 168000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.617814195316411e-05,
+      "loss": 0.7928,
+      "step": 169000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.611448774886924e-05,
+      "loss": 0.7656,
+      "step": 170000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.605032924392457e-05,
+      "loss": 0.7647,
+      "step": 171000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.598566713995718e-05,
+      "loss": 0.7523,
+      "step": 172000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.59205021441015e-05,
+      "loss": 0.7739,
+      "step": 173000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.58548349689915e-05,
+      "loss": 0.7857,
+      "step": 174000
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 9.578866633275288e-05,
+      "loss": 0.8132,
+      "step": 175000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.572199695899522e-05,
+      "loss": 0.8928,
+      "step": 176000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.565482757680415e-05,
+      "loss": 0.9479,
+      "step": 177000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.558715892073323e-05,
+      "loss": 0.8774,
+      "step": 178000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.551899173079607e-05,
+      "loss": 0.7822,
+      "step": 179000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.545032675245813e-05,
+      "loss": 0.7981,
+      "step": 180000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.538116473662861e-05,
+      "loss": 0.7582,
+      "step": 181000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.531150643965223e-05,
+      "loss": 0.7543,
+      "step": 182000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.524135262330098e-05,
+      "loss": 0.741,
+      "step": 183000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.517070405476575e-05,
+      "loss": 0.7712,
+      "step": 184000
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 9.509956150664796e-05,
+      "loss": 0.7824,
+      "step": 185000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.502792575695112e-05,
+      "loss": 0.8096,
+      "step": 186000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.49557975890723e-05,
+      "loss": 0.9033,
+      "step": 187000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.488317779179361e-05,
+      "loss": 0.9156,
+      "step": 188000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.481006715927351e-05,
+      "loss": 0.896,
+      "step": 189000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.473646649103818e-05,
+      "loss": 0.7307,
+      "step": 190000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.46623765919727e-05,
+      "loss": 0.8032,
+      "step": 191000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.458779827231237e-05,
+      "loss": 0.7586,
+      "step": 192000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.451273234763371e-05,
+      "loss": 0.7422,
+      "step": 193000
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 9.443717963884569e-05,
+      "loss": 0.7412,
+      "step": 194000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.43611409721806e-05,
+      "loss": 0.7738,
+      "step": 195000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.428461717918511e-05,
+      "loss": 0.7806,
+      "step": 196000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.420760909671118e-05,
+      "loss": 0.807,
+      "step": 197000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.413011756690685e-05,
+      "loss": 0.9269,
+      "step": 198000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.405214343720707e-05,
+      "loss": 0.8776,
+      "step": 199000
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 9.397368756032445e-05,
+      "loss": 0.8979,
+      "step": 200000
+    },
+    {
+      "epoch": 0.2,
+      "eval_loss": 0.7604823112487793,
+      "eval_runtime": 22.7684,
+      "eval_samples_per_second": 219.603,
+      "eval_steps_per_second": 3.47,
+      "step": 200000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.19299796631552e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6caf4b5ebffdcb04f4fec8820e2a50cd7e7dada8bbf5818d249024f9b029b50f
 size 1346893675

 version https://git-lfs.github.com/spec/v1
+oid sha256:de8a4f7df26972b1c1fe1546343f51ae325d6a1916a83baac53a80c81d4dd4ce
 size 1346893675

runs/Feb16_16-14-57_t1v-n-eeadb94b-w-0/events.out.tfevents.1676564607.t1v-n-eeadb94b-w-0.3898595.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cb0e9ec09f3b51afd6a302351e1087f71bcce087680397c33de7d54dcab01d36
-size 20388

 version https://git-lfs.github.com/spec/v1
+oid sha256:c86b06d1f8b18603f6ddeb5deb090948c3af173dea2f1dfd9bac06ba2cfd7d88
+size 28664