Training in progress, epoch 1

Files changed (8) hide show

logs/events.out.tfevents.1719316225.49cbd00d2005.382.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:298724a4bb557672c166bc1e25254912866c59cdddf96831c2184896ca9bdd45
+size 5427

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4db5ce53872114bd04603e9f4cf8a2c9fff8b5eba2e6c35fa6175cd08190265
 size 17549312

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e4101e13540b9ca54dbd8ddf761e2b1b8af8108fb9147967fcd9ee7dd0b7ff1
 size 17549312

run-0/checkpoint-527/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3ae20a202c55d96dbc7a99eb68b3c49d5f2889c97c0f7b7581a4369c38393b73
 size 17549312

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e4101e13540b9ca54dbd8ddf761e2b1b8af8108fb9147967fcd9ee7dd0b7ff1
 size 17549312

run-0/checkpoint-527/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53a8520796ad50f6ff85e7e87d2a41102c44b1f2273e6444ae31344537166243
 size 35123898

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e154f8de5d1ef22d68e299790c35d542007a54f497034b3baf80de7e6bc91a6
 size 35123898

run-0/checkpoint-527/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e5d8781fb59c88c7bad07954373a93237cb20c6820b8da7eae26083a78c3d342
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:e79638116c39075972d1c173f673dfdcd1943140b9d4d46a92b6cd0538475b05
 size 1064

run-0/checkpoint-527/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.7672018348623854,
   "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-527",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -10,25 +10,25 @@
   "log_history": [
     {
       "epoch": 1.0,
-      "grad_norm": 12.377176284790039,
-      "learning_rate": 1.5980854192157344e-05,
-      "loss": 3.0218,
       "step": 527
     },
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.7672018348623854,
-      "eval_loss": 2.191861391067505,
-      "eval_runtime": 2.5906,
-      "eval_samples_per_second": 336.603,
-      "eval_steps_per_second": 2.702,
       "step": 527
     }
   ],
   "logging_steps": 500,
-  "max_steps": 3162,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 6,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -46,9 +46,9 @@
   "train_batch_size": 128,
   "trial_name": null,
   "trial_params": {
-    "alpha": 0.275210688972374,
-    "learning_rate": 1.9177025030588814e-05,
-    "num_train_epochs": 6,
     "temperature": 6
   }
 }

 {
+  "best_metric": 0.8176605504587156,
   "best_model_checkpoint": "tiny-bert-sst2-distilled/run-0/checkpoint-527",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 1.0,
+      "grad_norm": 15.690781593322754,
+      "learning_rate": 0.0004329892843734803,
+      "loss": 1.29,
       "step": 527
     },
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.8176605504587156,
+      "eval_loss": 1.5847134590148926,
+      "eval_runtime": 2.4131,
+      "eval_samples_per_second": 361.36,
+      "eval_steps_per_second": 2.901,
       "step": 527
     }
   ],
   "logging_steps": 500,
+  "max_steps": 2108,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
   "train_batch_size": 128,
   "trial_name": null,
   "trial_params": {
+    "alpha": 0.19981548442581198,
+    "learning_rate": 0.000577319045831307,
+    "num_train_epochs": 4,
     "temperature": 6
   }
 }

run-0/checkpoint-527/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:15e7b4feae857373f91378a3d0efc15d0ec396bfba71e74c965086843aa6acf4
 size 5176

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b553ab9101fed6c5a9e75fca4cb81df81514d2d3f8ff94edc0c546949c119f9
 size 5176

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee9990afd96f204321e9e33fc4071f73d76355111015fd2ec723f4a4e4849ce7
 size 5176

 version https://git-lfs.github.com/spec/v1
+oid sha256:9b553ab9101fed6c5a9e75fca4cb81df81514d2d3f8ff94edc0c546949c119f9
 size 5176