Training in progress, step 70, checkpoint

Browse files

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +63 -3

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:376a3d27f0b1944494854ef53f3cae507ae395c3d1eb4a9fb04b4918e1482b14
 size 83945296

 version https://git-lfs.github.com/spec/v1
+oid sha256:98f4c3613d0942e1149efb5ec951f878e656ab8598ea1d74c4e1cc2f71b54b60
 size 83945296

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a66101811aa26237703ee0b600450fa3d9faaa7c72ad1d2093f56e124c8dd86
 size 42545748

 version https://git-lfs.github.com/spec/v1
+oid sha256:d2ee711433e187c4c3ef92ebe11a92651d96a20e76be34859e3f9387f5d9e8a5
 size 42545748

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:babf9cef0f970e1cd241f9533a5b0bc052a39fc9df617e7f31209a9691bd42d1
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:557e474a226d303e26d6758a2eb18bb0bbe3b1a451146f9953c40e79b727f273
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:87f5541cd8b8cc2355cb28b7b43b87c2e735f1841d8477f8ed4c15392845734c
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:1723a4b1c943236de3935bcf77e35b80aec5d8ffd41a734f2052202a2aabea88
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.024,
   "eval_steps": 1000,
-  "global_step": 60,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -367,13 +367,73 @@
       "learning_rate": 8.421052631578948e-05,
       "loss": 1.6805,
       "step": 60
     }
   ],
   "logging_steps": 1,
   "max_steps": 100,
   "num_train_epochs": 1,
   "save_steps": 10,
-  "total_flos": 3532725037301760.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.028,
   "eval_steps": 1000,
+  "global_step": 70,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 8.421052631578948e-05,
       "loss": 1.6805,
       "step": 60
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 8.210526315789474e-05,
+      "loss": 1.8059,
+      "step": 61
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 8e-05,
+      "loss": 1.6999,
+      "step": 62
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 7.789473684210526e-05,
+      "loss": 1.7289,
+      "step": 63
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 7.578947368421054e-05,
+      "loss": 1.395,
+      "step": 64
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 7.368421052631579e-05,
+      "loss": 1.5194,
+      "step": 65
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 7.157894736842105e-05,
+      "loss": 1.9656,
+      "step": 66
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 6.947368421052632e-05,
+      "loss": 1.7048,
+      "step": 67
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 6.736842105263159e-05,
+      "loss": 1.5836,
+      "step": 68
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 6.526315789473685e-05,
+      "loss": 1.7741,
+      "step": 69
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 6.31578947368421e-05,
+      "loss": 1.7412,
+      "step": 70
     }
   ],
   "logging_steps": 1,
   "max_steps": 100,
   "num_train_epochs": 1,
   "save_steps": 10,
+  "total_flos": 4233108315045888.0,
   "trial_name": null,
   "trial_params": null
 }