KoichiYasuoka
committed on
Commit
•
faba6e7
1
Parent(s):
8f0399e
bug fix
Browse files
README.md
CHANGED
@@ -53,8 +53,9 @@ class TaggerPipeline(TokenClassificationPipeline):
|
|
53 |
a2b,b2a=tokenizations.get_alignments(v,text)
|
54 |
for i,t in enumerate(a2b):
|
55 |
s,e=(0,0) if t==[] else (t[0],t[-1]+1)
|
56 |
-
if
|
57 |
s=([[-1]]+[x for x in a2b[0:i] if x>[]])[-1][-1]+1
|
|
|
58 |
e=([x for x in a2b[i+1:] if x>[]]+[[len(text)]])[0][0]
|
59 |
d[i]["start"],d[i]["end"]=s,e
|
60 |
return d
|
|
|
53 |
a2b,b2a=tokenizations.get_alignments(v,text)
|
54 |
for i,t in enumerate(a2b):
|
55 |
s,e=(0,0) if t==[] else (t[0],t[-1]+1)
|
56 |
+
if v[i].startswith(self.tokenizer.unk_token):
|
57 |
s=([[-1]]+[x for x in a2b[0:i] if x>[]])[-1][-1]+1
|
58 |
+
if v[i].endswith(self.tokenizer.unk_token):
|
59 |
e=([x for x in a2b[i+1:] if x>[]]+[[len(text)]])[0][0]
|
60 |
d[i]["start"],d[i]["end"]=s,e
|
61 |
return d
|