Model save

Files changed (6) hide show

all_results.json CHANGED Viewed

@@ -6,8 +6,8 @@
     "eval_samples_per_second": 13.325,
     "eval_steps_per_second": 1.777,
     "total_flos": 9299872197181440.0,
-    "train_loss": 2.0597532987594604,
-    "train_runtime": 8.5801,
-    "train_samples_per_second": 13.986,
-    "train_steps_per_second": 1.865
 }

     "eval_samples_per_second": 13.325,
     "eval_steps_per_second": 1.777,
     "total_flos": 9299872197181440.0,
+    "train_loss": 2.0122132897377014,
+    "train_runtime": 8.9154,
+    "train_samples_per_second": 13.46,
+    "train_steps_per_second": 1.795
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1a37fbaf95e6d2d4d0fdbfb0b3d339567b9b60312f68de65369294ce33eaba30
 size 343254736

 version https://git-lfs.github.com/spec/v1
+oid sha256:29e9ae72ffd7850be2a3b0dc5e74cce7d8e8fec4f531471a799d02a828b580ca
 size 343254736

runs/Mar22_10-48-55_X5C922065N/events.out.tfevents.1711100937.X5C922065N.52576.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9965efa251dc18aab5e56bc52fd656a67f314c22657383795610bda4f69be548
+size 6113

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 4.0,
     "total_flos": 9299872197181440.0,
-    "train_loss": 2.0597532987594604,
-    "train_runtime": 8.5801,
-    "train_samples_per_second": 13.986,
-    "train_steps_per_second": 1.865
 }

 {
     "epoch": 4.0,
     "total_flos": 9299872197181440.0,
+    "train_loss": 2.0122132897377014,
+    "train_runtime": 8.9154,
+    "train_samples_per_second": 13.46,
+    "train_steps_per_second": 1.795
 }

trainer_state.json CHANGED Viewed

@@ -10,19 +10,19 @@
   "log_history": [
     {
       "epoch": 2.5,
-      "grad_norm": 2.4165334701538086,
       "learning_rate": 7.500000000000001e-05,
-      "loss": 2.2555,
       "step": 10
     },
     {
       "epoch": 4.0,
       "step": 16,
       "total_flos": 9299872197181440.0,
-      "train_loss": 2.0597532987594604,
-      "train_runtime": 8.5801,
-      "train_samples_per_second": 13.986,
-      "train_steps_per_second": 1.865
     }
   ],
   "logging_steps": 10,

   "log_history": [
     {
       "epoch": 2.5,
+      "grad_norm": 2.5313448905944824,
       "learning_rate": 7.500000000000001e-05,
+      "loss": 2.2157,
       "step": 10
     },
     {
       "epoch": 4.0,
       "step": 16,
       "total_flos": 9299872197181440.0,
+      "train_loss": 2.0122132897377014,
+      "train_runtime": 8.9154,
+      "train_samples_per_second": 13.46,
+      "train_steps_per_second": 1.795
     }
   ],
   "logging_steps": 10,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3b866bf7e7002388dfcff6dcdf79fba35279dfbdb28c9f35e0cf98af2540d619
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:5986e60995f0b4a642b5145e8844c9037ab084eecbe52c98b6672614af74fed9
 size 4920