KoichiYasuoka
committed on
Commit
•
b87dbd2
1
Parent(s):
43e4326
常用漢字 support
Browse files
- tokenizer.json +29 -1
tokenizer.json
CHANGED
@@ -67,6 +67,34 @@
|
|
67 |
"Regex": " {2,}"
|
68 |
},
|
69 |
"content": " "
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
70 |
}
|
71 |
]
|
72 |
},
|
@@ -128166,4 +128194,4 @@
|
|
128166 |
]
|
128167 |
]
|
128168 |
}
|
128169 |
-
}
|
|
|
67 |
"Regex": " {2,}"
|
68 |
},
|
69 |
"content": " "
|
70 |
+
},
|
71 |
+
{
|
72 |
+
"type": "Replace",
|
73 |
+
"pattern": {
|
74 |
+
"String": "𠮟"
|
75 |
+
},
|
76 |
+
"content": "叱"
|
77 |
+
},
|
78 |
+
{
|
79 |
+
"type": "Replace",
|
80 |
+
"pattern": {
|
81 |
+
"String": "塡"
|
82 |
+
},
|
83 |
+
"content": "填"
|
84 |
+
},
|
85 |
+
{
|
86 |
+
"type": "Replace",
|
87 |
+
"pattern": {
|
88 |
+
"String": "剝"
|
89 |
+
},
|
90 |
+
"content": "剥"
|
91 |
+
},
|
92 |
+
{
|
93 |
+
"type": "Replace",
|
94 |
+
"pattern": {
|
95 |
+
"String": "頰"
|
96 |
+
},
|
97 |
+
"content": "頬"
|
98 |
}
|
99 |
]
|
100 |
},
|
|
|
128194 |
]
|
128195 |
]
|
128196 |
}
|
128197 |
+
}
|