bodo-pos-gpt2-fine-tune / tokenizer_config.json
Sanjib Narzary
GPT2 fine tune on bodo pos data
8e1e807
raw
history blame
261 Bytes
{
"add_prefix_space": true,
"clean_up_tokenization_spaces": true,
"model_max_length": 512,
"special_tokens": [
"<s>",
"<pad>",
"</s>",
"<unk>",
"<cls>",
"<sep>",
"<mask>"
],
"tokenizer_class": "PreTrainedTokenizerFast"
}