vamsibanda
commited on
Commit
•
8a2d2a7
1
Parent(s):
eb644f5
Update README.md
Browse files
README.md
CHANGED
@@ -43,6 +43,13 @@ model_name = 'vamsibanda/sbert-onnx-all-roberta-large-v1'
|
|
43 |
cache_folder = './'
|
44 |
model_path = os.path.join(cache_folder, model_name.replace("/", "_"))
|
45 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
46 |
def mean_pooling(model_output, attention_mask):
|
47 |
token_embeddings = model_output[0] #First element of model_output contains all token embeddings
|
48 |
input_mask_expanded = attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
|
@@ -65,10 +72,6 @@ tokenizer = AutoTokenizer.from_pretrained(model_path)
|
|
65 |
model = ORTModelForFeatureExtraction.from_pretrained(model_path, force_download=False)
|
66 |
pooling_layer = Pooling.load(f"{model_path}/1_Pooling")
|
67 |
|
68 |
-
|
69 |
-
embeddings = model(input_ids=token['input_ids'], attention_mask=token['attention_mask'])
|
70 |
-
sbert_embeddings = mean_pooling(embeddings, token['attention_mask'])
|
71 |
-
sbert_embeddings = F.normalize(sbert_embeddings, p=2, dim=1)
|
72 |
-
sbert_embeddings.tolist()[0]
|
73 |
|
74 |
```
|
|
|
43 |
cache_folder = './'
|
44 |
model_path = os.path.join(cache_folder, model_name.replace("/", "_"))
|
45 |
|
46 |
+
def generate_embedding(text):
|
47 |
+
token = tokenizer(text, return_tensors='pt')
|
48 |
+
embeddings = model(input_ids=token['input_ids'], attention_mask=token['attention_mask'])
|
49 |
+
sbert_embeddings = mean_pooling(embeddings, token['attention_mask'])
|
50 |
+
sbert_embeddings = F.normalize(sbert_embeddings, p=2, dim=1)
|
51 |
+
return sbert_embeddings.tolist()[0]
|
52 |
+
|
53 |
def mean_pooling(model_output, attention_mask):
|
54 |
token_embeddings = model_output[0] #First element of model_output contains all token embeddings
|
55 |
input_mask_expanded = attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
|
|
|
72 |
model = ORTModelForFeatureExtraction.from_pretrained(model_path, force_download=False)
|
73 |
pooling_layer = Pooling.load(f"{model_path}/1_Pooling")
|
74 |
|
75 |
+
generate_embedding('That is a happy person')
|
|
|
|
|
|
|
|
|
76 |
|
77 |
```
|