File size: 861 Bytes
6245545
 
5b8f3bd
6245545
5b8f3bd
6245545
 
 
 
 
 
 
 
 
 
 
5b8f3bd
6245545
 
5b8f3bd
6245545
5b8f3bd
 
6245545
 
5b8f3bd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from PyPDF2 import PdfReader
from transformers import pipeline
import gradio as gr

_SUMMARIZATION_MODEL = "stevhliu/my_awesome_billsum_model"

# Loading the model is expensive, so the pipeline is built once and reused
# across requests instead of being rebuilt on every upload.
_summarizer_cache = {}


def _get_summarizer():
    """Return the summarization pipeline, building it on first use only."""
    if _SUMMARIZATION_MODEL not in _summarizer_cache:
        _summarizer_cache[_SUMMARIZATION_MODEL] = pipeline(
            "summarization", model=_SUMMARIZATION_MODEL
        )
    return _summarizer_cache[_SUMMARIZATION_MODEL]


def _extract_pdf_text(path):
    """Return the text of every page of the PDF at *path*, one page per line block."""
    with open(path, "rb") as pdf_file:
        # A page without a text layer may give None/"" from extract_text();
        # treat it as empty so concatenation cannot raise TypeError.
        return "".join(
            (page.extract_text() or "") + "\n"
            for page in PdfReader(pdf_file).pages
        )


def summarize_pdf_content(files):
    """Summarize each uploaded PDF and return the summaries in upload order.

    Args:
        files: Iterable of uploaded files. Each item may be an object with a
            ``name`` attribute holding the file path, or the path itself.
            ``None`` or an empty collection is accepted.

    Returns:
        A list with one summary string per input file. A PDF from which no
        text could be extracted contributes an empty string so the result
        stays aligned with the inputs.
    """
    # Nothing uploaded: return before paying for the model load.
    if not files:
        return []

    summarizer = _get_summarizer()
    summaries = []

    for file in files:
        # Accept both file-like upload objects (.name) and plain path strings.
        path = getattr(file, "name", file)
        text = _extract_pdf_text(path)

        # No extractable text (e.g. image-only PDF): nothing to summarize.
        if not text.strip():
            summaries.append("")
            continue

        result = summarizer(
            text,
            max_length=50,
            min_length=10,
            do_sample=False,
            # Clip inputs longer than the model's maximum sequence length
            # rather than feeding the whole document through.
            truncation=True,
        )
        summaries.append(result[0]['summary_text'])

    return summaries

# Gradio UI: an upload button feeding summarize_pdf_content, with the result
# shown in a single text box.
# NOTE(review): summarize_pdf_content returns a list of strings; the Textbox
# presumably renders its string form -- confirm this is the intended display.
iface = gr.Interface(
    fn=summarize_pdf_content,
    # File extensions in file_types need a leading dot; a bare "pdf" is not
    # treated as an extension, so the picker filter would not match PDF files.
    inputs=gr.UploadButton("Click to Upload a PDF", file_types=[".pdf"], file_count="multiple"),
    outputs=gr.Textbox(label="Summarized Text"),
    title="PDF Summarizer"
)

# Start the web server for the interface.
iface.launch()