grapheme-llama / tokenizer_config.json
bbunzeck's picture
Upload 7 files
c88d306 verified
{
"added_tokens_decoder": {
"0": {
"content": "<|endoftext|>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"1": {
"content": "<pad>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"2": {
"content": "Y",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"3": {
"content": "e",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"4": {
"content": "a",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"5": {
"content": "h",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"6": {
"content": ".",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"7": {
"content": "\n",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"8": {
"content": "C",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"9": {
"content": "o",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"10": {
"content": "m",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"11": {
"content": "p",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"12": {
"content": "u",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"13": {
"content": "n",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"14": {
"content": "d",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"15": {
"content": "'",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"16": {
"content": "s",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"17": {
"content": " ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"18": {
"content": "t",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"19": {
"content": "i",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"20": {
"content": "g",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"21": {
"content": "l",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"22": {
"content": "k",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"23": {
"content": "x",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"24": {
"content": ",",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"25": {
"content": "r",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"26": {
"content": "N",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"27": {
"content": "w",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"28": {
"content": "v",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"29": {
"content": "T",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"30": {
"content": "f",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"31": {
"content": "A",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"32": {
"content": "b",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"33": {
"content": "E",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"34": {
"content": "c",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"35": {
"content": "y",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"36": {
"content": "O",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"37": {
"content": "S",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"38": {
"content": "j",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"39": {
"content": "I",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"40": {
"content": "R",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"41": {
"content": "?",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"42": {
"content": "D",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"43": {
"content": "-",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"44": {
"content": "q",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"45": {
"content": "W",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"46": {
"content": "Q",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"47": {
"content": "M",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"48": {
"content": "B",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"49": {
"content": "H",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"50": {
"content": "L",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"51": {
"content": "F",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"52": {
"content": "P",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"53": {
"content": "G",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"54": {
"content": "U",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"55": {
"content": "J",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"56": {
"content": "X",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"57": {
"content": ";",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"58": {
"content": "2",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"59": {
"content": "V",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"60": {
"content": "‘",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"61": {
"content": "’",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"62": {
"content": "!",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"63": {
"content": "é",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"64": {
"content": "/",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"65": {
"content": "1",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"66": {
"content": ":",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"67": {
"content": "K",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"68": {
"content": "z",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"69": {
"content": "Z",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"70": {
"content": "3",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"71": {
"content": "6",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"72": {
"content": "9",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"73": {
"content": "&",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"74": {
"content": "4",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"75": {
"content": "5",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"76": {
"content": "0",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"77": {
"content": "=",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"78": {
"content": "8",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"79": {
"content": "7",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"80": {
"content": "£",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"81": {
"content": "(",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"82": {
"content": ")",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"83": {
"content": "—",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"84": {
"content": "*",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"85": {
"content": "\"",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"86": {
"content": "%",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"87": {
"content": "“",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"88": {
"content": "”",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"89": {
"content": "_",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"90": {
"content": "+",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"91": {
"content": "$",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"92": {
"content": "^",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"93": {
"content": "ʊ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"94": {
"content": "č",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"95": {
"content": "#",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"96": {
"content": "æ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"97": {
"content": "ʌ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"98": {
"content": "ɷ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"99": {
"content": "ɩ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"100": {
"content": "ɛ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"101": {
"content": "ə",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"102": {
"content": "↫",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"103": {
"content": "à",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"104": {
"content": "|",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"105": {
"content": "[",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"106": {
"content": "]",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"107": {
"content": "°",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"108": {
"content": "Ö",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"109": {
"content": "À",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"110": {
"content": "ç",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"111": {
"content": "è",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"112": {
"content": "É",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"113": {
"content": "â",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"114": {
"content": "Ø",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"115": {
"content": "ê",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"116": {
"content": "~",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"117": {
"content": "ë",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"118": {
"content": "―",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"119": {
"content": "ï",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"120": {
"content": "ô",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"121": {
"content": "ü",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"122": {
"content": "⁄",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"123": {
"content": "Â",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"124": {
"content": "á",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"125": {
"content": "`",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"126": {
"content": "Æ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"127": {
"content": "È",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"128": {
"content": "�",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"129": {
"content": "ñ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"130": {
"content": "í",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"131": {
"content": "ú",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"132": {
"content": "ā",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"133": {
"content": "ó",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"134": {
"content": "ĕ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"135": {
"content": "ō",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"136": {
"content": "ä",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"137": {
"content": "Ó",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"138": {
"content": "ē",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"139": {
"content": "′",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"140": {
"content": "ī",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"141": {
"content": "Á",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"142": {
"content": "û",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"143": {
"content": "ö",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"144": {
"content": "ń",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"145": {
"content": "ă",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"146": {
"content": "†",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"147": {
"content": "ĭ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"148": {
"content": "ū",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"149": {
"content": "Ú",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"150": {
"content": "î",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"151": {
"content": "Í",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"152": {
"content": "§",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"153": {
"content": "Ō",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"154": {
"content": "Ā",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"155": {
"content": "@",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"156": {
"content": "}",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"157": {
"content": "☛",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"158": {
"content": "☚",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"159": {
"content": "Ñ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"160": {
"content": "{",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"161": {
"content": "–",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"162": {
"content": "·",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"163": {
"content": "Ü",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"164": {
"content": "©",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"165": {
"content": "Ë",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"166": {
"content": "♪",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"167": {
"content": "ã",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"168": {
"content": "¡",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"169": {
"content": "¤",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"170": {
"content": "÷",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"171": {
"content": "Û",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"172": {
"content": "Î",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"173": {
"content": "\\",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"174": {
"content": "",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"175": {
"content": "¶",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"176": {
"content": "Ä",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"177": {
"content": "ì",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"178": {
"content": "ò",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"179": {
"content": "¢",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"180": {
"content": "ù",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"181": {
"content": "Ê",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"182": {
"content": "±",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"183": {
"content": "Ð",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"184": {
"content": "Ô",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"185": {
"content": "¿",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"186": {
"content": "­",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"187": {
"content": "Ï",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"188": {
"content": "ý",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"189": {
"content": "Þ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"190": {
"content": "Ã",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"191": {
"content": "Ý",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"192": {
"content": "Ì",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"193": {
"content": "⬄",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"194": {
"content": "š",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"195": {
"content": "ž",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"196": {
"content": "♫",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"197": {
"content": "€",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"198": {
"content": "œ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"199": {
"content": "",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"200": {
"content": "​",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"201": {
"content": "œ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"202": {
"content": "Œ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"203": {
"content": "Ÿ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"204": {
"content": "ł",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"205": {
"content": "ż",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"206": {
"content": "š",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"207": {
"content": "Š",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"208": {
"content": "ð",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"209": {
"content": "®",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"210": {
"content": "¬",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"211": {
"content": "Å",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"212": {
"content": "¦",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"213": {
"content": "Ç",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"214": {
"content": "å",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"215": {
"content": "ˆ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"216": {
"content": "ş",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"217": {
"content": "ø",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"218": {
"content": "×",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"219": {
"content": "",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"220": {
"content": "€",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"221": {
"content": "‎",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"222": {
"content": "؟",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"223": {
"content": "ـ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"224": {
"content": "™",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"225": {
"content": "Ò",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"226": {
"content": "Ù",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"227": {
"content": "þ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"228": {
"content": "ž",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"229": {
"content": "„",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"230": {
"content": "ė",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"231": {
"content": "‚",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"232": {
"content": "ć",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"233": {
"content": "ś",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"234": {
"content": "ą",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"235": {
"content": "Č",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"236": {
"content": "ğ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"237": {
"content": "ș",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"238": {
"content": "Ś",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"239": {
"content": "ß",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"240": {
"content": "∂",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"241": {
"content": "ŭ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"242": {
"content": "ˈ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"243": {
"content": "ɫ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"244": {
"content": "ʋ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"245": {
"content": "ɐ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"246": {
"content": "ı",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"247": {
"content": "ň",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"248": {
"content": "đ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"249": {
"content": "ř",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"250": {
"content": "ě",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"251": {
"content": "₤",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"252": {
"content": "ǔ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"253": {
"content": "ễ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"254": {
"content": "ệ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"255": {
"content": "ề",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"256": {
"content": "ơ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"257": {
"content": "Ż",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"258": {
"content": "ő",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"259": {
"content": "−",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"260": {
"content": "→",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"261": {
"content": "ę",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"262": {
"content": "ɑ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"263": {
"content": "ː",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"264": {
"content": "ɔ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"265": {
"content": "ţ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"266": {
"content": "Ž",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"267": {
"content": "Ł",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"268": {
"content": "õ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"269": {
"content": "Đ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"270": {
"content": "ỗ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"271": {
"content": "ư",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"272": {
"content": "ờ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"273": {
"content": "≈",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"274": {
"content": "⊙",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"275": {
"content": "•",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"276": {
"content": "Ř",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"277": {
"content": "ů",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"278": {
"content": "ħ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"279": {
"content": "ṭ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"280": {
"content": "ġ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"281": {
"content": "ǁ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"282": {
"content": "Ľ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"283": {
"content": "İ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"284": {
"content": "ț",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"285": {
"content": "􏿾",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"286": {
"content": "⟨",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"287": {
"content": "⟩",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"288": {
"content": "ộ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"289": {
"content": "ầ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"290": {
"content": "ữ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"291": {
"content": "ủ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"292": {
"content": "⋅",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"293": {
"content": "ʒ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"294": {
"content": "Ş",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"295": {
"content": "ɪ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"296": {
"content": "₹",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"297": {
"content": "☯",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"298": {
"content": "ļ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"299": {
"content": "♯",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"300": {
"content": "♭",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"301": {
"content": "ʃ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"302": {
"content": "ɨ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"303": {
"content": "Ș",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"304": {
"content": "ź",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"305": {
"content": "Ṃ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"306": {
"content": "ḷ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"307": {
"content": "ʑ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"308": {
"content": "ứ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"309": {
"content": "ạ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"310": {
"content": "ṅ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"311": {
"content": "་",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"312": {
"content": "ー",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"313": {
"content": "ŋ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"314": {
"content": "ʼ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"315": {
"content": "į",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"316": {
"content": "ņ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"317": {
"content": "ḍ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"318": {
"content": "ṇ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"319": {
"content": "ṣ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"320": {
"content": "၁",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"321": {
"content": "၂",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"322": {
"content": "၃",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"323": {
"content": "၄",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"324": {
"content": "၅",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"325": {
"content": "၆",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"326": {
"content": "၇",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"327": {
"content": "၈",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"328": {
"content": "၉",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"329": {
"content": "၀",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"330": {
"content": "ĺ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"331": {
"content": "ķ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"332": {
"content": "Ḥ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"333": {
"content": "ʻ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"334": {
"content": "¥",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"335": {
"content": "ǒ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"336": {
"content": "ọ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"337": {
"content": "˥",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"338": {
"content": "˨",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"339": {
"content": "˩",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"340": {
"content": "ˌ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"341": {
"content": "۰",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"342": {
"content": "ʾ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"343": {
"content": "ḥ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"344": {
"content": "ʿ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"345": {
"content": "ď",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"346": {
"content": "Ṭ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"347": {
"content": "ả",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"348": {
"content": "█",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"349": {
"content": "Ĥ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"350": {
"content": "∴",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"351": {
"content": "ŏ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"352": {
"content": "ʁ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"353": {
"content": "ľ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
},
"354": {
"content": "Õ",
"lstrip": false,
"normalized": true,
"rstrip": false,
"single_word": false,
"special": false
}
},
"bos_token": "<|endoftext|>",
"clean_up_tokenization_spaces": true,
"eos_token": "<|endoftext|>",
"model_max_length": 1000000000000000019884624838656,
"pad_token": "<|endoftext|>",
"tokenizer_class": "PreTrainedTokenizerFast"
}