pdfchatbot / agent.py
ndn1954's picture
Create agent.py
41882a8
raw
history blame
No virus
1.81 kB
import os
from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.document_loaders import PyPDFLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.vectorstores import FAISS
from langchain.chains import ConversationalRetrievalChain
from langchain.llms import OpenAI
class Agent:
def __init__(self, openai_api_key: str | None = None) -> None:
# if openai_api_key is None, then it will look the enviroment variable OPENAI_API_KEY
self.embeddings = OpenAIEmbeddings(openai_api_key=openai_api_key)
self.text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
self.llm = OpenAI(temperature=0, openai_api_key=openai_api_key)
self.chat_history = None
self.chain = None
self.db = None
def ask(self, question: str) -> str:
if self.chain is None:
response = "Please, add a document."
else:
response = self.chain({"question": question, "chat_history": self.chat_history})
response = response["answer"].strip()
self.chat_history.append((question, response))
return response
def ingest(self, file_path: os.PathLike) -> None:
loader = PyPDFLoader(file_path)
documents = loader.load()
splitted_documents = self.text_splitter.split_documents(documents)
if self.db is None:
self.db = FAISS.from_documents(splitted_documents, self.embeddings)
self.chain = ConversationalRetrievalChain.from_llm(self.llm, self.db.as_retriever())
self.chat_history = []
else:
self.db.add_documents(splitted_documents)
def forget(self) -> None:
self.db = None
self.chain = None
self.chat_history = None