AlexHT_Hung committed on
Commit
8ca4fd7
·
1 Parent(s): 806da72

add <|func_start|>

Browse files
added_tokens.json CHANGED
@@ -1,6 +1,4 @@
1
  {
2
- "</s>": 2,
3
- "<s>": 1,
4
- "<unk>": 0,
5
- "<|func_end|>": 36128
6
  }
 
1
  {
2
+ "<|func_end|>": 36128,
3
+ "<|func_start|>": 36129
 
 
4
  }
special_tokens_map.json CHANGED
@@ -4,8 +4,32 @@
4
  "<s>",
5
  "</s>"
6
  ],
7
- "bos_token": "<s>",
8
- "eos_token": "</s>",
9
- "pad_token": "<unk>",
10
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  }
 
4
  "<s>",
5
  "</s>"
6
  ],
7
+ "bos_token": {
8
+ "content": "<s>",
9
+ "lstrip": false,
10
+ "normalized": false,
11
+ "rstrip": false,
12
+ "single_word": false
13
+ },
14
+ "eos_token": {
15
+ "content": "</s>",
16
+ "lstrip": false,
17
+ "normalized": false,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "pad_token": {
22
+ "content": "<unk>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false
27
+ },
28
+ "unk_token": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false
34
+ }
35
  }
tokenizer.json CHANGED
@@ -38,6 +38,15 @@
38
  "rstrip": true,
39
  "normalized": false,
40
  "special": false
 
 
 
 
 
 
 
 
 
41
  }
42
  ],
43
  "normalizer": {
@@ -97525,4 +97534,4 @@
97525
  "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁"
97526
  ]
97527
  }
97528
- }
 
38
  "rstrip": true,
39
  "normalized": false,
40
  "special": false
41
+ },
42
+ {
43
+ "id": 36129,
44
+ "content": "<|func_start|>",
45
+ "single_word": true,
46
+ "lstrip": true,
47
+ "rstrip": true,
48
+ "normalized": false,
49
+ "special": false
50
  }
51
  ],
52
  "normalizer": {
 
97534
  "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁"
97535
  ]
97536
  }
97537
+ }
tokenizer_config.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
@@ -31,6 +33,14 @@
31
  "rstrip": true,
32
  "single_word": true,
33
  "special": false
 
 
 
 
 
 
 
 
34
  }
35
  },
36
  "additional_special_tokens": [
 
1
  {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
  "added_tokens_decoder": {
5
  "0": {
6
  "content": "<unk>",
 
33
  "rstrip": true,
34
  "single_word": true,
35
  "special": false
36
+ },
37
+ "36129": {
38
+ "content": "<|func_start|>",
39
+ "lstrip": true,
40
+ "normalized": false,
41
+ "rstrip": true,
42
+ "single_word": true,
43
+ "special": false
44
  }
45
  },
46
  "additional_special_tokens": [