Spaces:

awacke1
/

Transcript-EDA-NLTK

Sleeping

awacke1 committed on Mar 14

Commit

0718e3a

•

1 Parent(s): 6556590

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -108,10 +108,16 @@ def load_example_files():
     return None
 def cluster_sentences(sentences, num_clusters):
     # Filter sentences with length over 10 characters
     sentences = [sentence for sentence in sentences if len(sentence) > 10]
     # Vectorize the sentences
     vectorizer = TfidfVectorizer()
     X = vectorizer.fit_transform(sentences)
@@ -136,6 +142,7 @@ def cluster_sentences(sentences, num_clusters):
     # Return the ordered clustered sentences without similarity scores for display
     return [[sentence for _, sentence in cluster] for cluster in clustered_sentences]
 # Function to convert text to a downloadable file
 def get_text_file_download_link(text_to_download, filename='Output.txt', button_label="💾 Save"):
     buffer = BytesIO()

     return None
 def cluster_sentences(sentences, num_clusters):
     # Filter sentences with length over 10 characters
     sentences = [sentence for sentence in sentences if len(sentence) > 10]
+    # Check if the number of sentences is less than the desired number of clusters
+    if len(sentences) < num_clusters:
+        # If so, adjust the number of clusters to match the number of sentences
+        num_clusters = len(sentences)
     # Vectorize the sentences
     vectorizer = TfidfVectorizer()
     X = vectorizer.fit_transform(sentences)
     # Return the ordered clustered sentences without similarity scores for display
     return [[sentence for _, sentence in cluster] for cluster in clustered_sentences]
 # Function to convert text to a downloadable file
 def get_text_file_download_link(text_to_download, filename='Output.txt', button_label="💾 Save"):
     buffer = BytesIO()