Oriya
sentencepiece
File size: 248 Bytes
d530982
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
{
  "tokenizer_class": "PreTrainedTokenizerFast",
  "model_type": "sentencepiece",
  "vocab_size": 50000,
  "unk_token": "<unk>",
  "bos_token": "<s>",
  "eos_token": "</s>",
  "pad_token": "<pad>",
  "sp_model_file": "odia_tokenizers_test.model"
}