Spaces:

tony346
/

PDF_Llama

Runtime error

tony346 committed on Oct 11, 2023

Commit

e541bfb

•

1 Parent(s): f81421e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,7 +15,7 @@ from langchain.llms import HuggingFaceHub
 def get_pdf_text(pdf_docs):
     text = ''
     # pdf_file_ = open(pdf_docs,'rb')
-    # text = "example hojin"
     pdf_reader = PdfReader(pdf_docs)
     for page in pdf_reader.pages:
         text += page.extract_text()
@@ -32,7 +32,7 @@ def get_text_chunks(text):
     )
     # text_splitter = CharacterTextSplitter(
     #     separator="\n",
-    #     chunk_size=1000,
     #     chunk_overlap=200,
     #     length_function=len
     # )
@@ -105,7 +105,7 @@ def get_json_file(docs):
     # with open(docs, 'r') as f:
     json_data = json.load(docs)
-    for f_key, f_value in json_data.items():
         for s_value in f_value:
             text += str(f_key) + str(s_value)
         text += '\n'
@@ -139,8 +139,8 @@ def main():
         st.subheader("Your documents")
         docs = st.file_uploader(
             "Upload your PDFs here and click on 'Process'", accept_multiple_files=True)
-        if st.button("Process"):
-            with st.spinner("Processing"):f
                 # get pdf text
                 raw_text = ""
@@ -171,7 +171,7 @@ def main():
                 # create vector store
                 vectorstore = get_vectorstore(text_chunks)
                 # create conversation chain
                 st.session_state.conversation = get_conversation_chain(
                     vectorstore)

 def get_pdf_text(pdf_docs):
     text = ''
     # pdf_file_ = open(pdf_docs,'rb')
+    # text = "example hofjin"
     pdf_reader = PdfReader(pdf_docs)
     for page in pdf_reader.pages:
         text += page.extract_text()
     )
     # text_splitter = CharacterTextSplitter(
     #     separator="\n",
+    #     chunk_size=10f00,
     #     chunk_overlap=200,
     #     length_function=len
     # )
     # with open(docs, 'r') as f:
     json_data = json.load(docs)
+f    for f_key, f_value in json_data.items():
         for s_value in f_value:
             text += str(f_key) + str(s_value)
         text += '\n'
         st.subheader("Your documents")
         docs = st.file_uploader(
             "Upload your PDFs here and click on 'Process'", accept_multiple_files=True)
+        if st.button("Process"):f
+            with st.spinner("Processing"):
                 # get pdf text
                 raw_text = ""
                 # create vector store
                 vectorstore = get_vectorstore(text_chunks)
+f
                 # create conversation chain
                 st.session_state.conversation = get_conversation_chain(
                     vectorstore)