File size: 550 Bytes
7fc9541
1730056
7fc9541
 
 
 
 
 
 
7851bae
0b13398
 
 
 
 
 
 
 
 
 
 
 
7851bae
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
from io import StringIO 

# Load the tokenizer and the seq2seq model from one pretrained checkpoint
# id so the two can never drift apart.
_CHECKPOINT = "facebook/bart-large-cnn"
tokenizer = AutoTokenizer.from_pretrained(_CHECKPOINT)
model = AutoModelForSeq2SeqLM.from_pretrained(_CHECKPOINT)

import streamlit as st
import os

import PyPDF2
import fitz


# Let the user upload a single PDF; the branch below only runs once the
# widget has returned a file.
uploaded_pdf = st.file_uploader("Load pdf: ", type=['pdf'])

if uploaded_pdf is not None:
    # getvalue() returns the complete upload regardless of the buffer's
    # current read position, unlike read(), which yields nothing once the
    # stream has already been consumed.
    pdf_bytes = uploaded_pdf.getvalue()

    # The context manager closes the document even if extraction raises,
    # which the former trailing doc.close() could not guarantee.
    with fitz.open(stream=pdf_bytes, filetype="pdf") as doc:
        # Page.get_text() is the current PyMuPDF name; the camelCase
        # getText() alias is deprecated and absent from recent releases.
        text = "".join(page.get_text() for page in doc)

    # Show the extracted text of all pages, concatenated in page order.
    st.write(text)