Spaces:

gizemsarsinlar
/

Tesseract_OCR

Running

App Files Files Community

gizemsarsinlar committed 20 days ago

Commit

7c963f3

•

1 Parent(s): 4cbfffc

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -46

app.py CHANGED Viewed

@@ -1,69 +1,53 @@
-from typing import List
 import pytesseract
 from PIL import Image
 import gradio as gr
 import cv2
 import numpy as np
-def tesseract_ocr_with_selection(filepath: str, coordinates: List[int] = None):
     # Load the image
-    image = Image.open(filepath)
-    if coordinates:
-        # Crop to the given (x1, y1, x2, y2) box before running OCR
-        x1, y1, x2, y2 = coordinates
-        image = image.crop((x1, y1, x2, y2))
-    # Run OCR (default language: English) and return the recognized text
-    return pytesseract.image_to_string(image=image, lang='eng')
-def parse_coordinates(coord_input: str):
-    """
-    Validate the coordinate string received from the user and return it as a list.
-    """
-    try:
-        # Split the coordinates on commas and convert each one to an integer
-        coords = [int(coord.strip()) for coord in coord_input.split(",")]
-        if len(coords) != 4:
-            raise ValueError("Lütfen tam olarak 4 koordinat girin (örnek: x1, y1, x2, y2).")
-        return coords
-    except ValueError:  # NOTE: also catches the length-check ValueError raised above, so its message is replaced by the generic one below
-        raise ValueError("Hatalı koordinat formatı. Lütfen şu formatı kullanın: x1, y1, x2, y2.")
-# Gradio UI settings
-title = "Tesseract OCR with Selection"
-description = "Gradio demo for Tesseract OCR with region selection (default language: English)."
-article = "<p style='text-align: center'><a href='https://tesseract-ocr.github.io/' target='_blank'>Tesseract documentation</a> | <a href='https://github.com/tesseract-ocr/tesseract' target='_blank'>Github Repo</a></p>"
-# examples = [
-#     ['examples/eurotext.png', "50, 50, 200, 200"],
-#     ['examples/tesseract_sample.png', "30, 40, 150, 120"],
-# ]
 with gr.Blocks() as demo:
     with gr.Row():
-        gr.Markdown("# Tesseract OCR with Selection")
     with gr.Row():
-        img_input = gr.Image(type="filepath", label="Input Image")
-        coords_input = gr.Textbox(label="Selection Coordinates (x1, y1, x2, y2)", placeholder="50, 50, 200, 200")
     with gr.Row():
-        ocr_button = gr.Button("Run OCR with Selection")
     with gr.Row():
         ocr_output = gr.Textbox(label="OCR Result")
-    def run_with_selection(image_path, coordinates):
-        try:
-            # Validate and parse the coordinates, then OCR the selected region
-            coords = parse_coordinates(coordinates)
-            return tesseract_ocr_with_selection(image_path, coords)
-        except ValueError as e:
-            return str(e)  # Show the error message to the user in the output box
     ocr_button.click(
-        run_with_selection,
-        inputs=[img_input, coords_input],
         outputs=[ocr_output]
     )
-if __name__ == '__main__':
     demo.launch()

 import pytesseract
 from PIL import Image
 import gradio as gr
 import cv2
 import numpy as np
+def select_roi_and_ocr(filepath: str):
     # Load the image
+    image = cv2.imread(filepath)
+    image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)  # RGB copy (author's note: for Gradio compatibility); only used for the selection window below
+    # Ask the user to select a region
+    roi = cv2.selectROI("Alanı Seçin (ESC ile çıkın)", image_rgb, showCrosshair=True)  # NOTE(review): opens a native OpenCV window; presumably needs a display on the host - confirm
+    cv2.destroyAllWindows()
+    # Unpack the selection as (x, y, width, height)
+    x, y, w, h = roi
+    if w == 0 or h == 0:  # Nothing was selected
+        return "Hiçbir alan seçilmedi!"
+    # Crop the selected region from the image as loaded by cv2.imread
+    cropped_image = image[y:y+h, x:x+w]
+    cropped_image_pil = Image.fromarray(cv2.cvtColor(cropped_image, cv2.COLOR_BGR2RGB))  # Convert BGR -> RGB and wrap as a PIL image for OCR
+    # Run OCR on the cropped region (language: English)
+    text = pytesseract.image_to_string(cropped_image_pil, lang="eng")
+    return text
+# Gradio interface
 with gr.Blocks() as demo:
     with gr.Row():
+        gr.Markdown("## Tesseract OCR with Mouse Selection Box")
     with gr.Row():
+        img_input = gr.Image(type="filepath", label="Upload Image")
     with gr.Row():
+        ocr_button = gr.Button("Run OCR with Mouse Selection")
     with gr.Row():
         ocr_output = gr.Textbox(label="OCR Result")
+    def run_ocr_with_mouse_selection(image_path):
+        return select_roi_and_ocr(image_path)
     ocr_button.click(
+        run_ocr_with_mouse_selection,
+        inputs=[img_input],
         outputs=[ocr_output]
     )
+if __name__ == "__main__":
     demo.launch()