KoichiYasuoka committed on
Commit
43e4326
1 Parent(s): 1a1a985
Files changed (1) hide show
  1. ud.py +1 -1
ud.py CHANGED
@@ -78,7 +78,7 @@ class MecabPreTokenizer(MecabTokenizer):
78
  else:
79
  e=s+len(c)
80
  z.append((s,e))
81
- return [normalized_string[s:e] for s,e in z]
82
  def pre_tokenize(self,pretok):
83
  pretok.split(self.mecab_split)
84
 
78
  else:
79
  e=s+len(c)
80
  z.append((s,e))
81
+ return [normalized_string[s:e] for s,e in z if e>0]
82
  def pre_tokenize(self,pretok):
83
  pretok.split(self.mecab_split)
84