Sonnyjim committed on
Commit
9c6425d
1 Parent(s): 4effac0

Fixed file loading for files whose names include capital letters

Browse files
Files changed (2) hide show
  1. funcs/embeddings.py +1 -1
  2. funcs/helper_functions.py +4 -4
funcs/embeddings.py CHANGED
@@ -18,7 +18,7 @@ def make_or_load_embeddings(docs, file_list, embeddings_out, embedding_model, em
18
  if embeddings_out.size == 0:
19
  print("Embeddings not found. Loading or generating new ones.")
20
 
21
- embeddings_file_names = [string.lower() for string in file_list if "embedding" in string.lower()]
22
 
23
  if embeddings_file_names:
24
  embeddings_file_name = embeddings_file_names[0]
 
18
  if embeddings_out.size == 0:
19
  print("Embeddings not found. Loading or generating new ones.")
20
 
21
+ embeddings_file_names = [string for string in file_list if "embedding" in string.lower()]
22
 
23
  if embeddings_file_names:
24
  embeddings_file_name = embeddings_file_names[0]
funcs/helper_functions.py CHANGED
@@ -96,7 +96,7 @@ def initial_file_load(in_file):
96
 
97
  file_list = [string.name for string in in_file]
98
 
99
- data_file_names = [string.lower() for string in file_list if "npz" not in string.lower() and "pkl" not in string.lower() and "topic_list.csv" not in string.lower()]
100
  if data_file_names:
101
  data_file_name = data_file_names[0]
102
  df = read_file(data_file_name)
@@ -110,19 +110,19 @@ def initial_file_load(in_file):
110
  print(error)
111
  output_text = error
112
 
113
- model_file_names = [string.lower() for string in file_list if "pkl" in string.lower()]
114
  if model_file_names:
115
  model_file_name = model_file_names[0]
116
  topic_model = read_file(model_file_name)
117
  output_text = "Bertopic model loaded."
118
 
119
- embedding_file_names = [string.lower() for string in file_list if "npz" in string.lower()]
120
  if embedding_file_names:
121
  embedding_file_name = embedding_file_names[0]
122
  embeddings = read_file(embedding_file_name)
123
  output_text = "Embeddings loaded."
124
 
125
- label_file_names = [string.lower() for string in file_list if "topic_list" in string.lower()]
126
  if label_file_names:
127
  label_file_name = label_file_names[0]
128
  custom_labels = read_file(label_file_name)
 
96
 
97
  file_list = [string.name for string in in_file]
98
 
99
+ data_file_names = [string for string in file_list if "npz" not in string.lower() and "pkl" not in string.lower() and "topic_list.csv" not in string.lower()]
100
  if data_file_names:
101
  data_file_name = data_file_names[0]
102
  df = read_file(data_file_name)
 
110
  print(error)
111
  output_text = error
112
 
113
+ model_file_names = [string for string in file_list if "pkl" in string.lower()]
114
  if model_file_names:
115
  model_file_name = model_file_names[0]
116
  topic_model = read_file(model_file_name)
117
  output_text = "Bertopic model loaded."
118
 
119
+ embedding_file_names = [string for string in file_list if "npz" in string.lower()]
120
  if embedding_file_names:
121
  embedding_file_name = embedding_file_names[0]
122
  embeddings = read_file(embedding_file_name)
123
  output_text = "Embeddings loaded."
124
 
125
+ label_file_names = [string for string in file_list if "topic_list" in string.lower()]
126
  if label_file_names:
127
  label_file_name = label_file_names[0]
128
  custom_labels = read_file(label_file_name)