update

Files changed (6) hide show

README.md DELETED Viewed

	@@ -1 +0,0 @@
1	- mbert-argument-mining-es

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.2825497290938373,
-    "train_runtime": 130.292,
-    "train_samples": 4405,
-    "train_samples_per_second": 101.426,
-    "train_steps_per_second": 6.355
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.24564219588448766,
+    "train_runtime": 262.0679,
+    "train_samples": 8808,
+    "train_samples_per_second": 100.829,
+    "train_steps_per_second": 6.308
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b98906def43a21275da98472d2ecf560cc290a2e7fcbef119eee61b4420310d
 size 709090132

 version https://git-lfs.github.com/spec/v1
+oid sha256:d88e185b8f01e5d7aff8d660772f93e7497df7ea384348229e5a140bbc692235
 size 709090132

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.2825497290938373,
-    "train_runtime": 130.292,
-    "train_samples": 4405,
-    "train_samples_per_second": 101.426,
-    "train_steps_per_second": 6.355
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.24564219588448766,
+    "train_runtime": 262.0679,
+    "train_samples": 8808,
+    "train_samples_per_second": 100.829,
+    "train_steps_per_second": 6.308
 }

trainer_state.json CHANGED Viewed

@@ -3,33 +3,45 @@
   "best_model_checkpoint": null,
   "epoch": 3.0,
   "eval_steps": 500,
-  "global_step": 828,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 1.81,
-      "learning_rate": 1.9806763285024154e-05,
-      "loss": 0.3629,
       "step": 500
     },
     {
       "epoch": 3.0,
-      "step": 828,
-      "total_flos": 739078528656780.0,
-      "train_loss": 0.2825497290938373,
-      "train_runtime": 130.292,
-      "train_samples_per_second": 101.426,
-      "train_steps_per_second": 6.355
     }
   ],
   "logging_steps": 500,
-  "max_steps": 828,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 739078528656780.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

   "best_model_checkpoint": null,
   "epoch": 3.0,
   "eval_steps": 500,
+  "global_step": 1653,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.91,
+      "learning_rate": 3.487598306110103e-05,
+      "loss": 0.4056,
       "step": 500
     },
+    {
+      "epoch": 1.81,
+      "learning_rate": 1.975196612220206e-05,
+      "loss": 0.2455,
+      "step": 1000
+    },
+    {
+      "epoch": 2.72,
+      "learning_rate": 4.627949183303086e-06,
+      "loss": 0.1298,
+      "step": 1500
+    },
     {
       "epoch": 3.0,
+      "step": 1653,
+      "total_flos": 1395101222261760.0,
+      "train_loss": 0.24564219588448766,
+      "train_runtime": 262.0679,
+      "train_samples_per_second": 100.829,
+      "train_steps_per_second": 6.308
     }
   ],
   "logging_steps": 500,
+  "max_steps": 1653,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
+  "total_flos": 1395101222261760.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ad3b261ba9512d1ea5f688672dc310df685d90c435dad4b05f113db6468be4c3
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:de11250632abb8e8078d16652e77145ac8ead77ea6eca4e95f9eb9fc9d3743bf
 size 4664