Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -228,6 +228,7 @@ def pdf2txt(docs):
|
|
228 |
if file_extension.lower() in ['py', 'txt', 'html', 'htm', 'xml', 'json']:
|
229 |
text += file.getvalue().decode('utf-8')
|
230 |
elif file_extension.lower() == 'pdf':
|
|
|
231 |
pdf = PdfFileReader(BytesIO(file.getvalue()))
|
232 |
for page in range(pdf.getNumPages()):
|
233 |
text += pdf.getPage(page).extractText()
|
|
|
228 |
if file_extension.lower() in ['py', 'txt', 'html', 'htm', 'xml', 'json']:
|
229 |
text += file.getvalue().decode('utf-8')
|
230 |
elif file_extension.lower() == 'pdf':
|
231 |
+
from PyPDF2 import PdfFileReader
|
232 |
pdf = PdfFileReader(BytesIO(file.getvalue()))
|
233 |
for page in range(pdf.getNumPages()):
|
234 |
text += pdf.getPage(page).extractText()
|