KoichiYasuoka committed on
Commit
4f4a0f6
1 Parent(s): a89586b
Files changed (1) hide show
  1. ud.py +1 -1
ud.py CHANGED
@@ -78,7 +78,7 @@ class MecabPreTokenizer(MecabTokenizer):
78
  else:
79
  e=s+len(c)
80
  z.append((s,e))
81
- return [normalized_string[s:e] for s,e in z]
82
  def pre_tokenize(self,pretok):
83
  pretok.split(self.mecab_split)
84
 
 
78
  else:
79
  e=s+len(c)
80
  z.append((s,e))
81
+ return [normalized_string[s:e] for s,e in z if e>0]
82
  def pre_tokenize(self,pretok):
83
  pretok.split(self.mecab_split)
84