Spaces:
Sleeping
Sleeping
File size: 356 Bytes
b6e3c51 |
1 2 3 4 5 6 7 8 9 10 11 12 13 |
import os
import fitz # PyMuPDF
def extract_text_from_file(file_obj):
    """Extract plain text from a ``.pdf`` or ``.txt`` file-like object.

    Args:
        file_obj: Object exposing a ``name`` attribute (used only to choose
            the parser by extension) and a ``read()`` method returning the
            file content.

    Returns:
        The extracted text. PDF pages are joined with newlines; text files
        are decoded as UTF-8. An empty string is returned for any other
        extension, or when the object has no usable name.

    Raises:
        UnicodeDecodeError: If a ``.txt`` payload is bytes that are not
            valid UTF-8.
    """
    # Compare case-insensitively so "REPORT.PDF" / "NOTES.TXT" are recognised;
    # a missing or None name is treated like an unsupported extension.
    name = str(getattr(file_obj, "name", "") or "").lower()

    if name.endswith(".pdf"):
        # The context manager closes the document even if extraction raises.
        with fitz.open(stream=file_obj.read(), filetype="pdf") as doc:
            return "\n".join(page.get_text() for page in doc)

    if name.endswith(".txt"):
        data = file_obj.read()
        # Text-mode streams already yield str; only bytes need decoding.
        return data if isinstance(data, str) else data.decode("utf-8")

    return ""
|