wholewhale committed on
Commit
a41389e
1 Parent(s): 7c40be6
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -4,6 +4,7 @@ from langchain.document_loaders import OnlinePDFLoader
4
  from langchain.text_splitter import CharacterTextSplitter
5
  from langchain.chat_models import ChatAnthropic
6
  from langchain.prompts import ChatPromptTemplate
 
7
 
8
  # Set API keys from environment variables
9
  os.environ['ANTHROPIC_API_KEY'] = os.getenv("ANTHROPIC_API_KEY")
@@ -16,11 +17,12 @@ def load_pdf(pdf_doc):
16
  if pdf_doc is None:
17
  return "No PDF uploaded."
18
 
19
- # Load and split PDF content
20
  loader = OnlinePDFLoader(pdf_doc.name)
21
  documents = loader.load()
22
- text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
23
- pdf_content = ' '.join(text_splitter.split_documents(documents))
 
24
 
25
  return "PDF Loaded Successfully."
26
 
 
4
  from langchain.text_splitter import CharacterTextSplitter
5
  from langchain.chat_models import ChatAnthropic
6
  from langchain.prompts import ChatPromptTemplate
7
+ from langchain.document_loaders import TextLoader
8
 
9
  # Set API keys from environment variables
10
  os.environ['ANTHROPIC_API_KEY'] = os.getenv("ANTHROPIC_API_KEY")
 
17
  if pdf_doc is None:
18
  return "No PDF uploaded."
19
 
20
+ # Load PDF content
21
  loader = OnlinePDFLoader(pdf_doc.name)
22
  documents = loader.load()
23
+
24
+ # Assuming the `documents` is a list of strings representing each page
25
+ pdf_content = ' '.join(documents)
26
 
27
  return "PDF Loaded Successfully."
28