Spaces:

Rivalcoder
/

Pdf-Processing

Sleeping

Rivalcoder commited on 18 days ago

Commit

ff08e35

1 Parent(s): 4de3353

Add application file

Files changed (1) hide show

app.py ADDED Viewed

+import fitz  # PyMuPDF
+import gradio as gr
+def extract_text_from_pdf(file):
+    if file is None:
+        return "No file uploaded."
+    try:
+        doc = fitz.open(stream=file.read(), filetype="pdf")
+        full_text = ""
+        for page_num in range(len(doc)):
+            page = doc.load_page(page_num)
+            text = page.get_text()
+            full_text += f"\n\n--- Page {page_num + 1} ---\n\n{text}"
+        return full_text
+    except Exception as e:
+        return f"Error: {str(e)}"
+gr.Interface(
+    fn=extract_text_from_pdf,
+    inputs=gr.File(label="Upload PDF", file_types=[".pdf"]),
+    outputs="text",
+    title="PDF to Text Extractor",
+    description="Upload a PDF file and get all the extracted text from each page.",
+).launch()