cxrmate / tokenizer_config.json
anicolson's picture
Upload tokenizer
16f5e77
raw
history blame
433 Bytes
{
"additional_special_tokens": [
"[NF]",
"[NI]",
"[PMT]",
"[PMT-SEP]",
"[NPF]",
"[NPI]"
],
"bos_token": "[BOS]",
"clean_up_tokenization_spaces": true,
"cls_token": "[BOS]",
"eos_token": "[EOS]",
"mask_token": "[MASK]",
"model_max_length": 1000000000000000019884624838656,
"pad_token": "[PAD]",
"sep_token": "[SEP]",
"tokenizer_class": "PreTrainedTokenizerFast",
"unk_token": "[UNK]"
}