Spaces:
Runtime error
Runtime error
sameemul-haque
commited on
Commit
•
ae244b4
1
Parent(s):
43a5958
refactor: remove unused code
Browse files
app.py
CHANGED
@@ -1,15 +1,10 @@
|
|
1 |
-
import os
|
2 |
-
import
|
3 |
-
import pickle
|
4 |
-
import textwrap
|
5 |
-
from pprint import pprint
|
6 |
from dotenv import load_dotenv
|
7 |
from langchain.chains import RetrievalQA
|
8 |
-
from InstructorEmbedding import INSTRUCTOR
|
9 |
from langchain_community.vectorstores import FAISS
|
10 |
from langchain_community.llms import HuggingFaceHub
|
11 |
from langchain_community.document_loaders import PyPDFLoader
|
12 |
-
from transformers import AutoTokenizer, AutoModelForCausalLM
|
13 |
from langchain_community.document_loaders import DirectoryLoader
|
14 |
from langchain.text_splitter import RecursiveCharacterTextSplitter
|
15 |
from langchain_community.embeddings import HuggingFaceInstructEmbeddings
|
@@ -26,22 +21,7 @@ def main():
|
|
26 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
|
27 |
texts = text_splitter.split_documents(documents)
|
28 |
|
29 |
-
# store the embeddings
|
30 |
-
# def store_embeddings(docs, embeddings, sotre_name, path):
|
31 |
-
# vectorStore = FAISS.from_documents(docs, embeddings)
|
32 |
-
# with open(f"{path}/faiss_{sotre_name}.pkl", "wb") as f:
|
33 |
-
# pickle.dump(vectorStore, f)
|
34 |
-
|
35 |
-
# def load_embeddings(sotre_name, path):
|
36 |
-
# with open(f"{path}/faiss_{sotre_name}.pkl", "rb") as f:
|
37 |
-
# VectorStore = pickle.load(f)
|
38 |
-
# return VectorStore
|
39 |
-
|
40 |
instructor_embeddings = HuggingFaceInstructEmbeddings(model_name="hkunlp/instructor-xl")
|
41 |
-
Embedding_store_path = f"./Embedding_store"
|
42 |
-
|
43 |
-
# store_embeddings(texts, instructor_embeddings, sotre_name='instructEmbeddings', path=Embedding_store_path)
|
44 |
-
# db_instructEmbedd = load_embeddings(sotre_name='instructEmbeddings', path=Embedding_store_path)
|
45 |
|
46 |
# create the retriever
|
47 |
db_instructEmbedd = FAISS.from_documents(texts, instructor_embeddings)
|
@@ -81,4 +61,4 @@ def main():
|
|
81 |
process_llm_response(llm_response)
|
82 |
|
83 |
if __name__ == '__main__':
|
84 |
-
main()
|
|
|
1 |
+
import os, textwrap
|
2 |
+
from pprint import pprint
|
|
|
|
|
|
|
3 |
from dotenv import load_dotenv
|
4 |
from langchain.chains import RetrievalQA
|
|
|
5 |
from langchain_community.vectorstores import FAISS
|
6 |
from langchain_community.llms import HuggingFaceHub
|
7 |
from langchain_community.document_loaders import PyPDFLoader
|
|
|
8 |
from langchain_community.document_loaders import DirectoryLoader
|
9 |
from langchain.text_splitter import RecursiveCharacterTextSplitter
|
10 |
from langchain_community.embeddings import HuggingFaceInstructEmbeddings
|
|
|
21 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
|
22 |
texts = text_splitter.split_documents(documents)
|
23 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
24 |
instructor_embeddings = HuggingFaceInstructEmbeddings(model_name="hkunlp/instructor-xl")
|
|
|
|
|
|
|
|
|
25 |
|
26 |
# create the retriever
|
27 |
db_instructEmbedd = FAISS.from_documents(texts, instructor_embeddings)
|
|
|
61 |
process_llm_response(llm_response)
|
62 |
|
63 |
if __name__ == '__main__':
|
64 |
+
main()
|