sberhe committed on
Commit
419397e
·
1 Parent(s): 9363e7a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -1
app.py CHANGED
@@ -36,8 +36,15 @@ def extract_embeddings(batch):
36
  embeddings_dataset = tokenized_datasets.map(extract_embeddings, batched=True, batch_size=batch_size)
37
 
38
  # Access the embeddings
39
- embeddings = np.vstack(embeddings_dataset["embeddings"])
 
40
 
 
 
 
 
 
 
41
  # Perform unsupervised clustering (K-Means)
42
  num_clusters = 5 # You can adjust this based on your data
43
  kmeans = KMeans(n_clusters=num_clusters)
 
36
  embeddings_dataset = tokenized_datasets.map(extract_embeddings, batched=True, batch_size=batch_size)
37
 
38
  # Access the embeddings
39
+ # Debugging code to print dataset keys
40
+ st.write("Dataset Keys:", embeddings_dataset.column_names)
41
 
42
+ # Access the embeddings
43
+ if "embeddings" in embeddings_dataset.column_names:
44
+ embeddings = np.vstack(embeddings_dataset["embeddings"])
45
+ else:
46
+ st.error("The 'embeddings' key is not present in the dataset.")
47
+
48
  # Perform unsupervised clustering (K-Means)
49
  num_clusters = 5 # You can adjust this based on your data
50
  kmeans = KMeans(n_clusters=num_clusters)