KoichiYasuoka committed on
Commit
faba6e7
1 Parent(s): 8f0399e
Files changed (1) hide show
  1. README.md +2 -1
README.md CHANGED
@@ -53,8 +53,9 @@ class TaggerPipeline(TokenClassificationPipeline):
53
  a2b,b2a=tokenizations.get_alignments(v,text)
54
  for i,t in enumerate(a2b):
55
  s,e=(0,0) if t==[] else (t[0],t[-1]+1)
56
- if t==[] and v[i]==self.tokenizer.unk_token:
57
  s=([[-1]]+[x for x in a2b[0:i] if x>[]])[-1][-1]+1
 
58
  e=([x for x in a2b[i+1:] if x>[]]+[[len(text)]])[0][0]
59
  d[i]["start"],d[i]["end"]=s,e
60
  return d
 
53
  a2b,b2a=tokenizations.get_alignments(v,text)
54
  for i,t in enumerate(a2b):
55
  s,e=(0,0) if t==[] else (t[0],t[-1]+1)
56
+ if v[i].startswith(self.tokenizer.unk_token):
57
  s=([[-1]]+[x for x in a2b[0:i] if x>[]])[-1][-1]+1
58
+ if v[i].endswith(self.tokenizer.unk_token):
59
  e=([x for x in a2b[i+1:] if x>[]]+[[len(text)]])[0][0]
60
  d[i]["start"],d[i]["end"]=s,e
61
  return d