Spaces:

bohmian
/

esg_countries_chatbot

Sleeping

bohmian committed on Feb 15, 2024

Commit

8ee023c

verified ·

1 Parent(s): 41c7fd6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -180,12 +180,11 @@ def get_llm():
     return llm
 # for chromadb vector store
-def get_embeddings():
-    with st.spinner(f'Getting HuggingFaceEmbeddings'):
-        # We use HuggingFaceEmbeddings() as it is open source and free to use.
-        # Initialize the default hf model for embedding the tokenized texts into vectors with semantic meanings
-        hf_embeddings = HuggingFaceEmbeddings()
-        return hf_embeddings
 # call above functions
 llm = get_llm()
@@ -279,7 +278,7 @@ def check_for_new_retrievers():
     # loop through new docs in chroma retrievers created by user scraping/pdf (if any)
     try:
         for doc in new_documents_chroma:
-            if (("bm25/" + doc.split('/')[1] + ".pickle") in new_documents_bm25): # check that the doc also exists for bm25 retriever
                 new_doc_country = doc.split('_')[1]
                 new_doc_chunk_size = doc.split('_')[3]

     return llm
 # for chromadb vector store
+def get_embeddings():
+    # We use HuggingFaceEmbeddings() as it is open source and free to use.
+    # Initialize the default hf model for embedding the tokenized texts into vectors with semantic meanings
+    hf_embeddings = HuggingFaceEmbeddings()
+    return hf_embeddings
 # call above functions
 llm = get_llm()
     # loop through new docs in chroma retrievers created by user scraping/pdf (if any)
     try:
         for doc in new_documents_chroma:
+            if ((("bm25\\" + doc.split('\\')[1] + ".pickle") in new_documents_bm25) | (("bm25/" + doc.split('/')[1] + ".pickle") in new_documents_bm25)): # check that the doc also exists for bm25 retriever
                 new_doc_country = doc.split('_')[1]
                 new_doc_chunk_size = doc.split('_')[3]