Model save

Files changed (9) hide show

added_tokens.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
-  "<|EOS|>": 50257,
-  "<|pad|>": 50258
 }

 {
+  "<BOS>": 50258,
+  "<EOS>": 50257,
+  "<PAD>": 50259
 }

all_results.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
-    "epoch": 5.0,
     "eval_loss": 3.2769460678100586,
     "eval_runtime": 0.5905,
     "eval_samples_per_second": 491.113,
     "eval_steps_per_second": 62.659,
-    "total_flos": 44318598912000.0,
-    "train_loss": 1.5727621986126077,
-    "train_runtime": 87.1353,
-    "train_samples_per_second": 66.448,
-    "train_steps_per_second": 8.32
 }

 {
+    "epoch": 3.0,
     "eval_loss": 3.2769460678100586,
     "eval_runtime": 0.5905,
     "eval_samples_per_second": 491.113,
     "eval_steps_per_second": 62.659,
+    "total_flos": 26593608960000.0,
+    "train_loss": 1.7656888413703304,
+    "train_runtime": 41.7769,
+    "train_samples_per_second": 83.156,
+    "train_steps_per_second": 10.412
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2261767a7c661cbc5040a7aa15933c31969986abd6988edd50b3f83e89c0d693
 size 510407229

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ef762aaffe86533871d820480043529a4cc2d54a0563a4642562790f988ae03
 size 510407229

runs/Jan08_19-07-15_f279fa53eed4/1673204875.0088935/events.out.tfevents.1673204875.f279fa53eed4.755.17 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:f2adb9ba590463f25f1f5ef577ac8ec04e2962c722bef3af9228babdc4c1a72b
+size 5615

runs/Jan08_19-07-15_f279fa53eed4/events.out.tfevents.1673204875.f279fa53eed4.755.16 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1c7f0d57ba33a5375ee80117f5e5dcbf31698bdd8927af8ab9c55930fa6e9276
+size 4420

special_tokens_map.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
-  "bos_token": "<|endoftext|>",
-  "eos_token": "<|EOS|>",
-  "pad_token": "<|pad|>",
   "unk_token": "<|endoftext|>"
 }

 {
+  "bos_token": "<BOS>",
+  "eos_token": "<EOS>",
+  "pad_token": "<PAD>",
   "unk_token": "<|endoftext|>"
 }

tokenizer.json CHANGED Viewed

@@ -2,17 +2,19 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 15,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
-    "strategy": "BatchLongest",
     "direction": "Right",
     "pad_to_multiple_of": null,
-    "pad_id": 50258,
     "pad_type_id": 0,
-    "pad_token": "<|pad|>"
   },
   "added_tokens": [
     {
@@ -26,7 +28,7 @@
     },
     {
       "id": 50257,
-      "content": "<|EOS|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -35,7 +37,16 @@
     },
     {
       "id": 50258,
-      "content": "<|pad|>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 7,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
+    "strategy": {
+      "Fixed": 7
+    },
     "direction": "Right",
     "pad_to_multiple_of": null,
+    "pad_id": 50259,
     "pad_type_id": 0,
+    "pad_token": "<PAD>"
   },
   "added_tokens": [
     {
     },
     {
       "id": 50257,
+      "content": "<EOS>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
     },
     {
       "id": 50258,
+      "content": "<BOS>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 50259,
+      "content": "<PAD>",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-    "epoch": 5.0,
-    "total_flos": 44318598912000.0,
-    "train_loss": 1.5727621986126077,
-    "train_runtime": 87.1353,
-    "train_samples_per_second": 66.448,
-    "train_steps_per_second": 8.32
 }

 {
+    "epoch": 3.0,
+    "total_flos": 26593608960000.0,
+    "train_loss": 1.7656888413703304,
+    "train_runtime": 41.7769,
+    "train_samples_per_second": 83.156,
+    "train_steps_per_second": 10.412
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eea3c7e4745d28b3ad1f42a6eb51f4f2252fd2c4335e4b1d459ca9106e6cba6b
 size 3515

 version https://git-lfs.github.com/spec/v1
+oid sha256:017544b9ce38ff4743efad99daada086efa61588a4a1bbae834380310ad8fa6c
 size 3515