Training in progress, step 500, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed724931d80c25381a64aa1ce3cd3545067e5f55c974d2c2c95b6d39556703db
 size 12609416

 version https://git-lfs.github.com/spec/v1
+oid sha256:1a484c67a7b85e5b5d8597ba20eb01fac01ceeb14985bd4c60caa3ee28a4fad1
 size 12609416

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d31eaf664d2efa4551079992f3a6db42b7be0f1151bc448f3c8eefea5285d4fc
 size 6615226

 version https://git-lfs.github.com/spec/v1
+oid sha256:a722bbae0d2ef3f7353b097bd1a45aff136a61bb588ae1cc739d062c715df5d0
 size 6615226

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e968442ee43cc742af32185068f114d6a1ad5f422b5dcbf2d21fb0dfd6ffb875
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:d456150d273def7b6aef58ff01646b7bb689c6c947da8898e5d6caf60a79b2a4
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fe3012fb121cd84e6e41f718fd33de9e34ed33145ada7b055f7e25e49408431d
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:71a96715f430c2eb0d6104363f54769b2c1bdb005671dc81f0d67833a84ba743
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-  "best_metric": 1.4858981370925903,
-  "best_model_checkpoint": "miner_id_24/checkpoint-450",
-  "epoch": 0.1913672124176058,
   "eval_steps": 50,
-  "global_step": 450,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -150,6 +150,21 @@
       "eval_samples_per_second": 59.639,
       "eval_steps_per_second": 14.94,
       "step": 450
     }
   ],
   "logging_steps": 50,
@@ -173,12 +188,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 5964283930214400.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 1.4820817708969116,
+  "best_model_checkpoint": "miner_id_24/checkpoint-500",
+  "epoch": 0.212630236019562,
   "eval_steps": 50,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 59.639,
       "eval_steps_per_second": 14.94,
       "step": 450
+    },
+    {
+      "epoch": 0.212630236019562,
+      "grad_norm": 3.2577598094940186,
+      "learning_rate": 0.0,
+      "loss": 2.9982,
+      "step": 500
+    },
+    {
+      "epoch": 0.212630236019562,
+      "eval_loss": 1.4820817708969116,
+      "eval_runtime": 16.6053,
+      "eval_samples_per_second": 59.62,
+      "eval_steps_per_second": 14.935,
+      "step": 500
     }
   ],
   "logging_steps": 50,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 6613636428595200.0,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null