best model, 7K steps
Browse files- tokenizer_config.json +3 -3
tokenizer_config.json
CHANGED
@@ -105,13 +105,13 @@
|
|
105 |
"clean_up_tokenization_spaces": true,
|
106 |
"eos_token": "</s>",
|
107 |
"language_codes": "m2m100",
|
108 |
-
"model_max_length":
|
109 |
"num_madeup_words": 8,
|
110 |
"pad_token": "<pad>",
|
111 |
"sep_token": "</s>",
|
112 |
"sp_model_kwargs": {},
|
113 |
-
"src_lang":
|
114 |
-
"tgt_lang":
|
115 |
"tokenizer_class": "M2M100Tokenizer",
|
116 |
"tokenizer_file": null,
|
117 |
"unk_token": "<unk>"
|
|
|
105 |
"clean_up_tokenization_spaces": true,
|
106 |
"eos_token": "</s>",
|
107 |
"language_codes": "m2m100",
|
108 |
+
"model_max_length": 1024,
|
109 |
"num_madeup_words": 8,
|
110 |
"pad_token": "<pad>",
|
111 |
"sep_token": "</s>",
|
112 |
"sp_model_kwargs": {},
|
113 |
+
"src_lang": "ru",
|
114 |
+
"tgt_lang": "zu",
|
115 |
"tokenizer_class": "M2M100Tokenizer",
|
116 |
"tokenizer_file": null,
|
117 |
"unk_token": "<unk>"
|