toshiba_2.O / app.py
neerajkalyank's picture
Update app.py
8f0b178 verified
raw
history blame
773 Bytes
import subprocess
import camelot
import pandas as pd
import gradio as gr
def install_ghostscript():
    """Install Ghostscript through apt-get and report whether it worked.

    Runs ``apt-get update`` and then ``apt-get install -y ghostscript``.
    As before, the install is attempted regardless of how the update
    step exits.

    Returns:
        bool: True when the install command exited with status 0,
        False otherwise. Callers that ignore the return value keep
        working unchanged.

    Raises:
        OSError: Propagated from ``subprocess.run`` when ``apt-get``
            itself cannot be executed.
    """
    # check=False is deliberate: a non-zero exit must not raise here,
    # the outcome is reported through the return value instead.
    subprocess.run(["apt-get", "update"], check=False)
    install_result = subprocess.run(
        ["apt-get", "install", "-y", "ghostscript"],
        check=False,
    )
    return install_result.returncode == 0
def extract_tables(pdf_file):
    """Extract every table found in a PDF into one DataFrame.

    Args:
        pdf_file: The uploaded file. Either an object exposing its path
            through a ``name`` attribute or a plain path string;
            ``None`` when nothing was uploaded.

    Returns:
        pandas.DataFrame: The ``df`` of every table camelot returns,
        concatenated with a fresh index. Empty when no file was given
        or no table was found. When camelot raises ``OSError`` a
        one-cell frame holding a retry message is returned instead.
    """
    if pdf_file is None:
        # Nothing uploaded: there is no path to read.
        return pd.DataFrame()

    # Accept both file wrappers (path stored in ``.name``) and bare paths.
    pdf_path = getattr(pdf_file, "name", pdf_file)

    try:
        tables = camelot.read_pdf(pdf_path, pages="all")
    except OSError:
        # NOTE(review): presumably camelot signals a missing Ghostscript
        # with OSError; other OSErrors (e.g. unreadable file) take this
        # path too -- confirm this is acceptable.
        install_ghostscript()
        # The message is wrapped in a DataFrame so the return type is
        # always tabular. NOTE(review): gradio's Dataframe output appears
        # to treat a bare str as a CSV path -- confirm.
        return pd.DataFrame({"message": ["Ghostscript installed. Please retry."]})

    frames = [table.df for table in tables]
    if not frames:
        # pd.concat raises ValueError when given an empty list.
        return pd.DataFrame()
    return pd.concat(frames, ignore_index=True)
# Gradio interface: a single PDF upload feeds extract_tables and the
# returned value is shown in a DataFrame component.
demo = gr.Interface(
    title="PDF Table Extractor",
    description="Extract tables from PDF files.",
    fn=extract_tables,
    inputs=gr.File(label="Upload PDF"),
    outputs=gr.DataFrame(label="Extracted Tables"),
)

# Launch the interface only when this file is run as a script, so that
# importing the module has no launch side effect.
if __name__ == "__main__":
    demo.launch()