philschmid
/

msmarco-distilbert-base-tas-b-onnx

Text Classification

Model card Files Files and versions Community

philschmid committed on Jun 24, 2022

Commit

4865f8a

·

1 Parent(s): 770e1d9

Update pipeline.py

Files changed (1) hide show

pipeline.py +5 -13

pipeline.py CHANGED Viewed

@@ -1,6 +1,6 @@
-from typing import  Dict, List, Any
 from optimum.onnxruntime import ORTModelForFeatureExtraction
-from transformers import pipeline, AutoTokenizer
 def cls_pooling(model_output):
     return model_output.last_hidden_state[:,0]
@@ -11,20 +11,12 @@ class PreTrainedPipeline():
         self.tokenizer = AutoTokenizer.from_pretrained(path, model_max_length=128)
-    def __call__(self, inputs: Any) -> Dict[str, Any]:
-        """
-        Args:
-            data (:obj:`str`):
-                a string containing some text
-        Return:
-            A :obj:`list`:. The object returned should be a list of one list like [[{"label": 0.9939950108528137}]] containing :
-                - "label": A string representing what the label/class is. There can be multiple labels.
-                - "score": A score between 0 and 1 describing how confident the model is for this label/class.
-        """
         # tokenize the input
         encoded_input = self.tokenizer(inputs, padding="longest", truncation=True, return_tensors='pt')
         # run the model
         model_output = self.model(**encoded_input, return_dict=True)
         embeddings = cls_pooling(model_output)
-        return {"vectors": [float(vec) for vec in embeddings[0].tolist()]}

+from typing import  Dict,List, Any
 from optimum.onnxruntime import ORTModelForFeatureExtraction
+from transformers import  AutoTokenizer
 def cls_pooling(model_output):
     return model_output.last_hidden_state[:,0]
         self.tokenizer = AutoTokenizer.from_pretrained(path, model_max_length=128)
+    def __call__(self, inputs: Any) -> Dict[str, List[float]]:
         # tokenize the input
         encoded_input = self.tokenizer(inputs, padding="longest", truncation=True, return_tensors='pt')
         # run the model
         model_output = self.model(**encoded_input, return_dict=True)
         embeddings = cls_pooling(model_output)
+        return {"vectors": embeddings[0].tolist()}