# llamaChatBot/chatBot/common/pdfToText.py
# Th3BossC -- initial commit (23d152f)
from langchain.document_loaders import PyPDFLoader
import os
# Directory that loadLatestPdf() lists to find the PDF to load. The path is
# relative, so it resolves against the process's current working directory.
# Note that the value already ends with a trailing slash.
pdfLocation = 'chatBot/static/pdfs/'
def loadLatestPdf():
    """Load the highest-numbered PDF in ``pdfLocation`` and split it.

    PDFs in the directory are expected to be named ``<number>.pdf``. The
    file with the largest number is treated as the latest one. Entries that
    do not match that pattern (hidden files, other extensions, non-numeric
    names) are ignored, so they can no longer shift the selection the way a
    raw directory-entry count would.

    Returns:
        Whatever ``PyPDFLoader.load_and_split()`` produces for the selected
        file (in LangChain, a list of document chunks).

    Raises:
        FileNotFoundError: If ``pdfLocation`` does not exist (raised by
            ``os.listdir``).
        Exception: Any error ``PyPDFLoader`` raises when the selected file
            is missing or unreadable is propagated unchanged.
    """
    numbered = []
    for entry in os.listdir(pdfLocation):
        stem, ext = os.path.splitext(entry)
        # Only plain ASCII digit stems are accepted so that int() is safe.
        if ext == ".pdf" and stem.isascii() and stem.isdigit():
            # Keep the real file name so names like "007.pdf" still resolve.
            numbered.append((int(stem), entry))

    # With no numbered PDF present, fall back to "0.pdf" -- the same path an
    # empty directory produced before -- and let the loader report the
    # missing file exactly as it always has.
    _, latestName = max(numbered, default=(0, "0.pdf"))

    # os.path.join avoids the doubled slash that plain string formatting
    # produced, since pdfLocation already ends with "/".
    loader = PyPDFLoader(os.path.join(pdfLocation, latestName))
    return loader.load_and_split()