KoichiYasuoka committed on
Commit
b87dbd2
1 Parent(s): 43e4326

常用漢字 support

Browse files
Files changed (1) hide show
  1. tokenizer.json +29 -1
tokenizer.json CHANGED
@@ -67,6 +67,34 @@
67
  "Regex": " {2,}"
68
  },
69
  "content": " "
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  }
71
  ]
72
  },
@@ -128166,4 +128194,4 @@
128166
  ]
128167
  ]
128168
  }
128169
- }
 
67
  "Regex": " {2,}"
68
  },
69
  "content": " "
70
+ },
71
+ {
72
+ "type": "Replace",
73
+ "pattern": {
74
+ "String": "𠮟"
75
+ },
76
+ "content": "叱"
77
+ },
78
+ {
79
+ "type": "Replace",
80
+ "pattern": {
81
+ "String": "塡"
82
+ },
83
+ "content": "填"
84
+ },
85
+ {
86
+ "type": "Replace",
87
+ "pattern": {
88
+ "String": "剝"
89
+ },
90
+ "content": "剥"
91
+ },
92
+ {
93
+ "type": "Replace",
94
+ "pattern": {
95
+ "String": "頰"
96
+ },
97
+ "content": "頬"
98
  }
99
  ]
100
  },
 
128194
  ]
128195
  ]
128196
  }
128197
+ }