Mishmosh committed on
Commit
9b952ec
1 Parent(s): 1f56077

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -10
app.py CHANGED
@@ -1,11 +1,11 @@
1
  # https://huggingface.co/spaces/Mishmosh/MichelleAssessment3
2
- !pip install PyPDF2
3
- !pip install sentencepiece
4
- !pip install pdfminer.six
5
- !pip install pdfplumber
6
- !pip install pdf2image
7
- !pip install Pillow
8
- !pip install pytesseract
9
  # @title
10
  !apt-get install poppler-utils
11
  !apt install tesseract-ocr
@@ -210,11 +210,11 @@ def read_pdf(pdf_path):
210
  return text_per_page
211
 
212
  #google drive
213
- from google.colab import drive
214
- drive.mount('/content/drive')
215
  #read PDF
216
 
217
- pdf_path = '/content/drive/MyDrive/ArticleHidden.pdf' #article 11
218
 
219
  text_per_page = read_pdf(pdf_path)
220
 
 
1
  # https://huggingface.co/spaces/Mishmosh/MichelleAssessment3
2
+ #!pip install PyPDF2
3
+ #!pip install sentencepiece
4
+ #!pip install pdfminer.six
5
+ #!pip install pdfplumber
6
+ #!pip install pdf2image
7
+ #!pip install Pillow
8
+ #!pip install pytesseract
9
  # @title
10
  !apt-get install poppler-utils
11
  !apt install tesseract-ocr
 
210
  return text_per_page
211
 
212
  #google drive
213
+ #from google.colab import drive
214
+ #drive.mount('/content/drive')
215
  #read PDF
216
 
217
+ pdf_path = 'https://huggingface.co/spaces/Mishmosh/MichelleAssessment3/blob/main/Article%2011%20Hidden%20Technical%20Debt%20in%20Machine%20Learning%20Systems.pdf' #article 11
218
 
219
  text_per_page = read_pdf(pdf_path)
220