Commit
•
e5dd1fd
1
Parent(s):
6eaafd9
Update app.py
Browse files
app.py
CHANGED
@@ -3,7 +3,7 @@ from PIL import Image
|
|
3 |
import textwrap
|
4 |
import google.generativeai as genai
|
5 |
import os
|
6 |
-
import
|
7 |
|
8 |
# Function to display formatted Markdown text
|
9 |
def to_markdown(text):
|
@@ -24,11 +24,11 @@ def generate_gemini_content(prompt, model_name='gemini-pro-vision', image=None):
|
|
24 |
def extract_text_from_pdf(pdf_path):
|
25 |
text = ""
|
26 |
with open(pdf_path, 'rb') as file:
|
27 |
-
pdf_reader =
|
28 |
-
num_pages = pdf_reader.
|
29 |
for page_num in range(num_pages):
|
30 |
-
page = pdf_reader.
|
31 |
-
text += page.
|
32 |
return text
|
33 |
|
34 |
# Function to process PDFs in a folder
|
|
|
3 |
import textwrap
|
4 |
import google.generativeai as genai
|
5 |
import os
|
6 |
+
from PyPDF2 import PdfReader
|
7 |
|
8 |
# Function to display formatted Markdown text
|
9 |
def to_markdown(text):
|
|
|
24 |
def extract_text_from_pdf(pdf_path):
    """Return the text of every page of a PDF, concatenated in page order.

    Args:
        pdf_path: Path of the PDF file to open (opened in binary mode).

    Returns:
        A single string made of each page's extracted text joined with no
        separator; an empty string when the document has no pages.

    Raises:
        OSError: If the file at ``pdf_path`` cannot be opened.
    """
    # Extraction happens inside the ``with`` block because the reader
    # is built on the open file handle.
    with open(pdf_path, 'rb') as pdf_file:
        pdf_reader = PdfReader(pdf_file)
        # Iterate the pages directly instead of indexing by position, and
        # join once instead of growing a string page by page.  ``or ""``
        # keeps the join safe should a page yield no text value.
        return "".join(
            page.extract_text() or "" for page in pdf_reader.pages
        )
|
33 |
|
34 |
# Function to process PDFs in a folder
|