awacke1 committed on
Commit
cc0c0af
1 Parent(s): d11a287

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -228,6 +228,7 @@ def pdf2txt(docs):
228
  if file_extension.lower() in ['py', 'txt', 'html', 'htm', 'xml', 'json']:
229
  text += file.getvalue().decode('utf-8')
230
  elif file_extension.lower() == 'pdf':
 
231
  pdf = PdfFileReader(BytesIO(file.getvalue()))
232
  for page in range(pdf.getNumPages()):
233
  text += pdf.getPage(page).extractText()
 
228
  if file_extension.lower() in ['py', 'txt', 'html', 'htm', 'xml', 'json']:
229
  text += file.getvalue().decode('utf-8')
230
  elif file_extension.lower() == 'pdf':
231
+ from PyPDF2 import PdfFileReader
232
  pdf = PdfFileReader(BytesIO(file.getvalue()))
233
  for page in range(pdf.getNumPages()):
234
  text += pdf.getPage(page).extractText()