Younes Belkada
committed on
Commit
·
1d7b146
1
Parent(s):
dc5e103
add tokenizer
Browse files
- special_tokens_map.json +1 -0
- spiece.model +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +1 -0
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
|
spiece.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5cbdfa8aa7c54c8c5af85b78c309c54a5f2749a20468bf6f60eee007fe6fec1
|
3 |
+
size 805634
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "[PAD]", "extra_ids": 0, "additional_special_tokens": [], "bos_token": "<s>", "cls_token": "[CLS]", "sep_token": "[SEP]", "mask_token": "[MASK]", "do_lower_case": true, "special_tokens_map_file": "/root/.cache/huggingface/transformers/b5690eac5a5e74c1002160161ad9a816835ff9bb3cc2db4b61d0fba5d14b9a5b.9049458ebcd1cf666b7b0a046aa394597f12e611077571cfc86e0938f8675d82", "name_or_path": "rinna/japanese-roberta-base", "sp_model_kwargs": {}, "tokenizer_class": "T5Tokenizer"}
|