Spaces:

rianders
/

live_view_embeddings

Running

rianders committed on May 13

Commit

95c80a2

•

1 Parent(s): 24297f2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,19 +11,20 @@ def get_bert_embeddings(words):
     model = BertModel.from_pretrained('bert-base-uncased')
     embeddings = []
-    # Extract embeddings
     for word in words:
         inputs = tokenizer(word, return_tensors='pt')
         outputs = model(**inputs)
-        embeddings.append(outputs.last_hidden_state[0][0].detach().numpy())
-    # Reduce dimensions to 3 using PCA
     if len(embeddings) > 0:
         pca = PCA(n_components=3)
         reduced_embeddings = pca.fit_transform(np.array(embeddings))
         return reduced_embeddings
     return []
 # Plotly plotting function
 def plot_interactive_bert_embeddings(embeddings, words):
     if len(words) < 4:

     model = BertModel.from_pretrained('bert-base-uncased')
     embeddings = []
     for word in words:
         inputs = tokenizer(word, return_tensors='pt')
         outputs = model(**inputs)
+        # Use the [CLS] token's embedding
+        cls_embedding = outputs.last_hidden_state[0][0].detach().numpy()
+        embeddings.append(cls_embedding)
     if len(embeddings) > 0:
         pca = PCA(n_components=3)
         reduced_embeddings = pca.fit_transform(np.array(embeddings))
         return reduced_embeddings
     return []
 # Plotly plotting function
 def plot_interactive_bert_embeddings(embeddings, words):
     if len(words) < 4: