Update app.py
Browse files
app.py
CHANGED
@@ -6,22 +6,22 @@ import torch, json
|
|
6 |
tokenizer = AutoTokenizer.from_pretrained("distilroberta-base")
|
7 |
|
8 |
with open("dataset_types_encoded.json", "r") as fp:
|
9 |
-
|
10 |
|
11 |
-
|
12 |
|
13 |
inf_session = rt.InferenceSession('dataset-classifier-distilroberta-quantized.onnx')
|
14 |
input_name = inf_session.get_inputs()[0].name
|
15 |
output_name = inf_session.get_outputs()[0].name
|
16 |
|
17 |
-
def
|
18 |
input_ids = tokenizer(description)['input_ids'][:512]
|
19 |
logits = inf_session.run([output_name], {input_name: [input_ids]})[0]
|
20 |
logits = torch.FloatTensor(logits)
|
21 |
probs = torch.sigmoid(logits)[0]
|
22 |
-
return dict(zip(
|
23 |
|
24 |
label = gr.outputs.Label(num_top_classes=3)
|
25 |
-
iface = gr.Interface(fn=
|
26 |
iface.launch(inline=False)
|
27 |
|
|
|
6 |
# Tokenizer for the "distilroberta-base" checkpoint; used to turn input text
# into token ids before inference.
tokenizer = AutoTokenizer.from_pretrained("distilroberta-base")

# Load the category mapping. JSON is UTF-8 by specification, so the encoding
# is given explicitly instead of relying on the platform default.
with open("dataset_types_encoded.json", "r", encoding="utf-8") as fp:
    encode_category_types = json.load(fp)

# Only the category names (the mapping's keys) are needed for labelling.
# NOTE(review): the key order is presumed to match the order of the model's
# output scores -- confirm against how the JSON file was produced.
categories = list(encode_category_types.keys())

# Quantized ONNX classifier. The names of its first input and first output
# are looked up once here so each inference call can reuse them.
inf_session = rt.InferenceSession('dataset-classifier-distilroberta-quantized.onnx')
input_name = inf_session.get_inputs()[0].name
output_name = inf_session.get_outputs()[0].name
|
16 |
|
17 |
+
def classify_dataset_type(description):
    """Score a text description against every known dataset category.

    Args:
        description: The text to classify.

    Returns:
        A dict mapping each name in ``categories`` to a float score: the
        sigmoid of the matching model logit, so each score lies between
        0 and 1 and is computed independently of the others.
    """
    # Truncate inside the tokenizer rather than slicing the id list
    # afterwards: slicing cuts off the closing special token whenever the
    # text is longer than the limit, while tokenizer-side truncation keeps it.
    input_ids = tokenizer(
        description, truncation=True, max_length=512
    )['input_ids']

    # The session is fed a batch containing this single sequence; run()
    # returns a list with one entry per requested output, hence the [0].
    logits = inf_session.run([output_name], {input_name: [input_ids]})[0]
    logits = torch.FloatTensor(logits)

    # Take the first (only) row of the batch after the sigmoid.
    probs = torch.sigmoid(logits)[0]
    return dict(zip(categories, probs.tolist()))
|
23 |
|
24 |
# Output widget limited to the three top classes.
label = gr.outputs.Label(num_top_classes=3)

# Wire the classifier to a plain text input and the label output, then
# start the app.
iface = gr.Interface(
    fn=classify_dataset_type,
    inputs="text",
    outputs=label,
)
iface.launch(inline=False)
|
27 |
|