NuExtract-large / tokenizer_config.json
Alexandre-Numind's picture
Upload tokenizer
a0bd67f verified
raw
history blame contribute delete
672 Bytes
{
"_commit_hash": null,
"_from_auto": true,
"added_tokens_decoder": {},
"auto_map": {
"AutoTokenizer": [
"tokenization_phi3_small.Phi3SmallTokenizer",
null
]
},
"bos_token": "<|endoftext|>",
"chat_template": "{{ bos_token }}{% for message in messages %}{{'<|' + message['role'] + '|>' + '\n' + message['content'] + '<|end|>\n' }}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ eos_token }}{% endif %}",
"clean_up_tokenization_spaces": true,
"eos_token": "<|endoftext|>",
"model_max_length": 8192,
"pad_token": "<|endoftext|>",
"tokenizer_class": "Phi3SmallTokenizer",
"trust_remote_code": true
}