Update tokenizer_config.json
#1
by
ybelkada
- opened
- tokenizer_config.json +1 -7
tokenizer_config.json
CHANGED
@@ -1,11 +1,5 @@
|
|
1 |
{
|
2 |
"added_tokens_decoder": {},
|
3 |
-
"auto_map": {
|
4 |
-
"AutoTokenizer": [
|
5 |
-
"THUDM/chatglm3-6b--tokenization_chatglm.ChatGLMTokenizer",
|
6 |
-
null
|
7 |
-
]
|
8 |
-
},
|
9 |
"chat_template": "{% for message in messages %}{% if loop.first %}[gMASK]sop<|{{ message['role'] }}|> \n {{ message['content'] }}{% else %}<|{{ message['role'] }}|> \n {{ message['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>{% endif %}",
|
10 |
"clean_up_tokenization_spaces": false,
|
11 |
"do_lower_case": false,
|
@@ -14,6 +8,6 @@
|
|
14 |
"pad_token": "<unk>",
|
15 |
"padding_side": "left",
|
16 |
"remove_space": false,
|
17 |
-
"tokenizer_class": "ChatGLMTokenizer",
|
18 |
"unk_token": "<unk>"
|
19 |
}
|
|
|
1 |
{
|
2 |
"added_tokens_decoder": {},
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
"chat_template": "{% for message in messages %}{% if loop.first %}[gMASK]sop<|{{ message['role'] }}|> \n {{ message['content'] }}{% else %}<|{{ message['role'] }}|> \n {{ message['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>{% endif %}",
|
4 |
"clean_up_tokenization_spaces": false,
|
5 |
"do_lower_case": false,
|
|
|
8 |
"pad_token": "<unk>",
|
9 |
"padding_side": "left",
|
10 |
"remove_space": false,
|
11 |
+
"tokenizer_class": "LlamaTokenizer",
|
12 |
"unk_token": "<unk>"
|
13 |
}
|