Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -36,8 +36,15 @@ def extract_embeddings(batch):
|
|
| 36 |
embeddings_dataset = tokenized_datasets.map(extract_embeddings, batched=True, batch_size=batch_size)
|
| 37 |
|
| 38 |
# Access the embeddings
|
| 39 |
-
|
|
|
|
| 40 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 41 |
# Perform unsupervised clustering (K-Means)
|
| 42 |
num_clusters = 5 # You can adjust this based on your data
|
| 43 |
kmeans = KMeans(n_clusters=num_clusters)
|
|
|
|
| 36 |
embeddings_dataset = tokenized_datasets.map(extract_embeddings, batched=True, batch_size=batch_size)
|
| 37 |
|
| 38 |
# Access the embeddings
|
| 39 |
+
# Debugging code to print dataset keys
|
| 40 |
+
st.write("Dataset Keys:", embeddings_dataset.column_names)
|
| 41 |
|
| 42 |
+
# Access the embeddings
|
| 43 |
+
if "embeddings" in embeddings_dataset.column_names:
|
| 44 |
+
embeddings = np.vstack(embeddings_dataset["embeddings"])
|
| 45 |
+
else:
|
| 46 |
+
st.error("The 'embeddings' key is not present in the dataset.")
|
| 47 |
+
|
| 48 |
# Perform unsupervised clustering (K-Means)
|
| 49 |
num_clusters = 5 # You can adjust this based on your data
|
| 50 |
kmeans = KMeans(n_clusters=num_clusters)
|