Spaces:

Tonic
/

GOT-OCR

Running on Zero

App Files Community

Tonic committed on Sep 13

Commit

68e36bf

•

1 Parent(s): 4a9ef6f

do it normally

Browse files

Files changed (1) hide show

app.py +9 -16

app.py CHANGED Viewed

@@ -49,8 +49,6 @@ model = AutoModel.from_pretrained('ucaslcl/GOT-OCR2_0', trust_remote_code=True,
 model = model.eval().cuda()
 model.config.pad_token_id = tokenizer.eos_token_id
 def save_image_to_temp_file(image):
     with tempfile.NamedTemporaryFile(delete=False, suffix=".png") as temp_file:
         image.save(temp_file, format="PNG")
@@ -62,32 +60,27 @@ def process_image(image, task, ocr_type=None, ocr_box=None, ocr_color=None):
         if image is None:
             return "No image provided", None
-        # Save the PIL Image to a temporary file
         temp_image_path = save_image_to_temp_file(image)
-        with io.BytesIO() as buffer:
-            pil_image.save(buffer, format="PNG")
-            image_path = "/tmp/temp_image.png"
-            with open(image_path, "wb") as f:
-                f.write(buffer.getvalue())
         if task == "Plain Text OCR":
-            res = model.chat(tokenizer, image, ocr_type='ocr')
         elif task == "Format Text OCR":
-            res = model.chat(tokenizer, image, ocr_type='format')
         elif task == "Fine-grained OCR (Box)":
-            res = model.chat(tokenizer, image, ocr_type=ocr_type, ocr_box=ocr_box)
         elif task == "Fine-grained OCR (Color)":
-            res = model.chat(tokenizer, image, ocr_type=ocr_type, ocr_color=ocr_color)
         elif task == "Multi-crop OCR":
-            res = model.chat_crop(tokenizer, image_file=image)
         elif task == "Render Formatted OCR":
-            res = model.chat(tokenizer, image, ocr_type='format', render=True, save_render_file='./results/demo.html')
             with open('./results/demo.html', 'r') as f:
                 html_content = f.read()
             return res, html_content
-        os.remove(image_path)
         return res, None
     except Exception as e:

 model = model.eval().cuda()
 model.config.pad_token_id = tokenizer.eos_token_id
 def save_image_to_temp_file(image):
     with tempfile.NamedTemporaryFile(delete=False, suffix=".png") as temp_file:
         image.save(temp_file, format="PNG")
         if image is None:
             return "No image provided", None
         temp_image_path = save_image_to_temp_file(image)
         if task == "Plain Text OCR":
+            res = model.chat(tokenizer, temp_image_path, ocr_type='ocr')
         elif task == "Format Text OCR":
+            res = model.chat(tokenizer, temp_image_path, ocr_type='format')
         elif task == "Fine-grained OCR (Box)":
+            res = model.chat(tokenizer, temp_image_path, ocr_type=ocr_type, ocr_box=ocr_box)
         elif task == "Fine-grained OCR (Color)":
+            res = model.chat(tokenizer, temp_image_path, ocr_type=ocr_type, ocr_color=ocr_color)
         elif task == "Multi-crop OCR":
+            res = model.chat_crop(tokenizer, image_file=temp_image_path)
         elif task == "Render Formatted OCR":
+            res = model.chat(tokenizer, temp_image_path, ocr_type='format', render=True, save_render_file='./results/demo.html')
             with open('./results/demo.html', 'r') as f:
                 html_content = f.read()
+            os.remove(temp_image_path)
             return res, html_content
+        # Clean up
+        os.remove(temp_image_path)
         return res, None
     except Exception as e: