deeplearningwithpython5240 committed on
Commit
b353170
1 Parent(s): a8ffb38

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -26,7 +26,7 @@ def process_data(input_data,columnname = 'text', num_data = 100):
26
  random.seed(20979738)
27
  processed_data = [i for i in input_data[columnname]]
28
  random_selection = random.sample(processed_data, num_data)
29
- filtered_data = filter_similar_items(random_selection, similarity_threshold = 0.9)
30
  st.write('Number of data input: ',len(random_selection))
31
  st.write('After removing duplicates: ',len(filtered_data))
32
  return filtered_data
 
26
  random.seed(20979738)
27
  processed_data = [i for i in input_data[columnname]]
28
  random_selection = random.sample(processed_data, num_data)
29
+ filtered_data = filter_similar_items(random_selection, similarity_threshold = 0.75)
30
  st.write('Number of data input: ',len(random_selection))
31
  st.write('After removing duplicates: ',len(filtered_data))
32
  return filtered_data