Spaces:
Runtime error
Runtime error
- ape/instance.py +9 -4
ape/instance.py
CHANGED
@@ -80,9 +80,12 @@ def load_qa(file='./ape/data/qa_train.json'):
|
|
80 |
raw_data = json.load(open(file, encoding='UTF8'))
|
81 |
for i in raw_data:
|
82 |
input = i['text']
|
83 |
-
|
84 |
-
output =
|
85 |
-
|
|
|
|
|
|
|
86 |
data.append((input, output))
|
87 |
return data
|
88 |
|
@@ -103,7 +106,9 @@ def load_entity(file='./ape/data/entity_train.json'):
|
|
103 |
input = i['text']
|
104 |
output = []
|
105 |
for j in i['labels']:
|
106 |
-
|
|
|
|
|
107 |
output = json.dumps(output, ensure_ascii=False)
|
108 |
data.append((input, output))
|
109 |
return data
|
|
|
80 |
raw_data = json.load(open(file, encoding='UTF8'))
|
81 |
for i in raw_data:
|
82 |
input = i['text']
|
83 |
+
# Keep only one QA pair; otherwise the model input length is easily exceeded
|
84 |
+
output = []
|
85 |
+
for j in i['annotations']:
|
86 |
+
output.append(json.dumps({'问题': j["Q"], '回答': j["A"]}, ensure_ascii=False))
|
87 |
+
output = sorted(output, key=lambda x: len(x))
|
88 |
+
output = output[0]
|
89 |
data.append((input, output))
|
90 |
return data
|
91 |
|
|
|
106 |
input = i['text']
|
107 |
output = []
|
108 |
for j in i['labels']:
|
109 |
+
# Filter to a subset of entity types; this could also be split into individual entity types
|
110 |
+
if j[1] in ['DRUG_DOSAGE', 'DRUG_TASTE', 'DRUG_EFFICACY']:
|
111 |
+
output.append({'类型': j[1], '实体': j[-1]})
|
112 |
output = json.dumps(output, ensure_ascii=False)
|
113 |
data.append((input, output))
|
114 |
return data
|