sameemul-haque commited on
Commit
ae244b4
1 Parent(s): 43a5958

refactor: remove unused code

Browse files
Files changed (1) hide show
  1. app.py +3 -23
app.py CHANGED
@@ -1,15 +1,10 @@
1
- import os
2
- import faiss
3
- import pickle
4
- import textwrap
5
- from pprint import pprint
6
  from dotenv import load_dotenv
7
  from langchain.chains import RetrievalQA
8
- from InstructorEmbedding import INSTRUCTOR
9
  from langchain_community.vectorstores import FAISS
10
  from langchain_community.llms import HuggingFaceHub
11
  from langchain_community.document_loaders import PyPDFLoader
12
- from transformers import AutoTokenizer, AutoModelForCausalLM
13
  from langchain_community.document_loaders import DirectoryLoader
14
  from langchain.text_splitter import RecursiveCharacterTextSplitter
15
  from langchain_community.embeddings import HuggingFaceInstructEmbeddings
@@ -26,22 +21,7 @@ def main():
26
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
27
  texts = text_splitter.split_documents(documents)
28
 
29
- # store the embeddings
30
- # def store_embeddings(docs, embeddings, sotre_name, path):
31
- # vectorStore = FAISS.from_documents(docs, embeddings)
32
- # with open(f"{path}/faiss_{sotre_name}.pkl", "wb") as f:
33
- # pickle.dump(vectorStore, f)
34
-
35
- # def load_embeddings(sotre_name, path):
36
- # with open(f"{path}/faiss_{sotre_name}.pkl", "rb") as f:
37
- # VectorStore = pickle.load(f)
38
- # return VectorStore
39
-
40
  instructor_embeddings = HuggingFaceInstructEmbeddings(model_name="hkunlp/instructor-xl")
41
- Embedding_store_path = f"./Embedding_store"
42
-
43
- # store_embeddings(texts, instructor_embeddings, sotre_name='instructEmbeddings', path=Embedding_store_path)
44
- # db_instructEmbedd = load_embeddings(sotre_name='instructEmbeddings', path=Embedding_store_path)
45
 
46
  # create the retriever
47
  db_instructEmbedd = FAISS.from_documents(texts, instructor_embeddings)
@@ -81,4 +61,4 @@ def main():
81
  process_llm_response(llm_response)
82
 
83
  if __name__ == '__main__':
84
- main()
 
1
+ import os, textwrap
2
+ from pprint import pprint
 
 
 
3
  from dotenv import load_dotenv
4
  from langchain.chains import RetrievalQA
 
5
  from langchain_community.vectorstores import FAISS
6
  from langchain_community.llms import HuggingFaceHub
7
  from langchain_community.document_loaders import PyPDFLoader
 
8
  from langchain_community.document_loaders import DirectoryLoader
9
  from langchain.text_splitter import RecursiveCharacterTextSplitter
10
  from langchain_community.embeddings import HuggingFaceInstructEmbeddings
 
21
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
22
  texts = text_splitter.split_documents(documents)
23
 
 
 
 
 
 
 
 
 
 
 
 
24
  instructor_embeddings = HuggingFaceInstructEmbeddings(model_name="hkunlp/instructor-xl")
 
 
 
 
25
 
26
  # create the retriever
27
  db_instructEmbedd = FAISS.from_documents(texts, instructor_embeddings)
 
61
  process_llm_response(llm_response)
62
 
63
  if __name__ == '__main__':
64
+ main()