Spaces:

Infinity-1995
/

Fake-Job-detection

Sleeping

Infinity-1995 committed on Oct 18

Commit

fb39cec

verified ·

1 Parent(s): d0f094c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,14 +10,16 @@ classifier = pipeline("text-classification", model="distilbert-base-uncased-fine
 def detect_job(text, file):
     extracted_text = ""
     if file:
-        filename = file.name
         if filename.endswith(".pdf"):
-            images = convert_from_bytes(file.read())
             for img in images:
                 extracted_text += pytesseract.image_to_string(img) + "\n"
         else:
-            img = Image.open(file)
             extracted_text = pytesseract.image_to_string(img)
     full_text = text + "\n" + extracted_text
     if full_text.strip() == "":
         return "No text provided!"
@@ -31,7 +33,7 @@ iface = gr.Interface(
     fn=detect_job,
     inputs=[
         gr.Textbox(lines=10, placeholder="Paste job description here..."),
-        gr.File(label="Upload PDF/Image", file_types=[".pdf", ".png", ".jpg", ".jpeg"], type="file")
     ],
     outputs="text",
     title="Fake Job Detector"

 def detect_job(text, file):
     extracted_text = ""
     if file:
+        filename = file.name if hasattr(file, "name") else "uploaded_file"
         if filename.endswith(".pdf"):
+            # file is bytes, convert PDF to images
+            images = convert_from_bytes(file.read() if hasattr(file, "read") else file)
             for img in images:
                 extracted_text += pytesseract.image_to_string(img) + "\n"
         else:
+            img = Image.open(file if hasattr(file, "read") else open(file, "rb"))
             extracted_text = pytesseract.image_to_string(img)
     full_text = text + "\n" + extracted_text
     if full_text.strip() == "":
         return "No text provided!"
     fn=detect_job,
     inputs=[
         gr.Textbox(lines=10, placeholder="Paste job description here..."),
+        gr.File(label="Upload PDF/Image", file_types=[".pdf", ".png", ".jpg", ".jpeg"], type="binary")
     ],
     outputs="text",
     title="Fake Job Detector"