jonra1993 committed on
Commit
c2fc522
·
1 Parent(s): 802ca46

Model save

Browse files
added_tokens.json CHANGED
@@ -1,4 +1,5 @@
1
  {
2
- "<|EOS|>": 50257,
3
- "<|pad|>": 50258
 
4
  }
 
1
  {
2
+ "<BOS>": 50258,
3
+ "<EOS>": 50257,
4
+ "<PAD>": 50259
5
  }
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 5.0,
3
  "eval_loss": 3.2769460678100586,
4
  "eval_runtime": 0.5905,
5
  "eval_samples_per_second": 491.113,
6
  "eval_steps_per_second": 62.659,
7
- "total_flos": 44318598912000.0,
8
- "train_loss": 1.5727621986126077,
9
- "train_runtime": 87.1353,
10
- "train_samples_per_second": 66.448,
11
- "train_steps_per_second": 8.32
12
  }
 
1
  {
2
+ "epoch": 3.0,
3
  "eval_loss": 3.2769460678100586,
4
  "eval_runtime": 0.5905,
5
  "eval_samples_per_second": 491.113,
6
  "eval_steps_per_second": 62.659,
7
+ "total_flos": 26593608960000.0,
8
+ "train_loss": 1.7656888413703304,
9
+ "train_runtime": 41.7769,
10
+ "train_samples_per_second": 83.156,
11
+ "train_steps_per_second": 10.412
12
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2261767a7c661cbc5040a7aa15933c31969986abd6988edd50b3f83e89c0d693
3
  size 510407229
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ef762aaffe86533871d820480043529a4cc2d54a0563a4642562790f988ae03
3
  size 510407229
runs/Jan08_19-07-15_f279fa53eed4/1673204875.0088935/events.out.tfevents.1673204875.f279fa53eed4.755.17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2adb9ba590463f25f1f5ef577ac8ec04e2962c722bef3af9228babdc4c1a72b
3
+ size 5615
runs/Jan08_19-07-15_f279fa53eed4/events.out.tfevents.1673204875.f279fa53eed4.755.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c7f0d57ba33a5375ee80117f5e5dcbf31698bdd8927af8ab9c55930fa6e9276
3
+ size 4420
special_tokens_map.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|EOS|>",
4
- "pad_token": "<|pad|>",
5
  "unk_token": "<|endoftext|>"
6
  }
 
1
  {
2
+ "bos_token": "<BOS>",
3
+ "eos_token": "<EOS>",
4
+ "pad_token": "<PAD>",
5
  "unk_token": "<|endoftext|>"
6
  }
tokenizer.json CHANGED
@@ -2,17 +2,19 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 15,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
- "strategy": "BatchLongest",
 
 
11
  "direction": "Right",
12
  "pad_to_multiple_of": null,
13
- "pad_id": 50258,
14
  "pad_type_id": 0,
15
- "pad_token": "<|pad|>"
16
  },
17
  "added_tokens": [
18
  {
@@ -26,7 +28,7 @@
26
  },
27
  {
28
  "id": 50257,
29
- "content": "<|EOS|>",
30
  "single_word": false,
31
  "lstrip": false,
32
  "rstrip": false,
@@ -35,7 +37,16 @@
35
  },
36
  {
37
  "id": 50258,
38
- "content": "<|pad|>",
 
 
 
 
 
 
 
 
 
39
  "single_word": false,
40
  "lstrip": false,
41
  "rstrip": false,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 7,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
+ "strategy": {
11
+ "Fixed": 7
12
+ },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
15
+ "pad_id": 50259,
16
  "pad_type_id": 0,
17
+ "pad_token": "<PAD>"
18
  },
19
  "added_tokens": [
20
  {
 
28
  },
29
  {
30
  "id": 50257,
31
+ "content": "<EOS>",
32
  "single_word": false,
33
  "lstrip": false,
34
  "rstrip": false,
 
37
  },
38
  {
39
  "id": 50258,
40
+ "content": "<BOS>",
41
+ "single_word": false,
42
+ "lstrip": false,
43
+ "rstrip": false,
44
+ "normalized": false,
45
+ "special": true
46
+ },
47
+ {
48
+ "id": 50259,
49
+ "content": "<PAD>",
50
  "single_word": false,
51
  "lstrip": false,
52
  "rstrip": false,
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 5.0,
3
- "total_flos": 44318598912000.0,
4
- "train_loss": 1.5727621986126077,
5
- "train_runtime": 87.1353,
6
- "train_samples_per_second": 66.448,
7
- "train_steps_per_second": 8.32
8
  }
 
1
  {
2
+ "epoch": 3.0,
3
+ "total_flos": 26593608960000.0,
4
+ "train_loss": 1.7656888413703304,
5
+ "train_runtime": 41.7769,
6
+ "train_samples_per_second": 83.156,
7
+ "train_steps_per_second": 10.412
8
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eea3c7e4745d28b3ad1f42a6eb51f4f2252fd2c4335e4b1d459ca9106e6cba6b
3
  size 3515
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:017544b9ce38ff4743efad99daada086efa61588a4a1bbae834380310ad8fa6c
3
  size 3515