Spaces:

IRVLUTD
/

DH-YOLO

Sleeping

App Files Files Community

hololens commited on Sep 30, 2024

Commit

ec41162

•

1 Parent(s): 326f023

init commit

Browse files

Files changed (6) hide show

app.py +102 -0
pretrained_ckpts/dh-yolo-exp-31-pb-1532.pt +3 -0
pretrained_ckpts/dh-yolo-exp-31-pl-1532.pt +3 -0
pretrained_ckpts/dh-yolo-exp27-pb-1008.pt +3 -0
pretrained_ckpts/dh-yolo-v1-pb-ddf-524.pt +3 -0
requirements.txt +4 -0

app.py ADDED Viewed

	@@ -0,0 +1,102 @@

+import os
+import logging
+import gradio as gr
+from PIL import Image as PILImg
+from iteach_toolkit.DHYOLO import DHYOLODetector
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+def detect_objects(selected_model, input_image, conf, imu_threshold, detections):
+    try:
+        model_path = model_options[selected_model]
+        dhyolo = DHYOLODetector(model_path)
+        # Save the input image temporarily to a path for processing
+        input_image_path = "dhyolo_temp_input_image.jpg"
+        input_image.save(input_image_path)
+        # Perform prediction on the image
+        orig_image, detections = dhyolo.predict(input_image_path, conf, imu_threshold, detections)
+        # Log the detections
+        logger.info("Detections: %s", detections)
+        # Plot the bounding boxes on the original image
+        orig_image, image_with_bboxes = dhyolo.plot_bboxes(attach_watermark=True)
+        # Convert the image (with bounding boxes) from a NumPy array to a PIL Image for display.
+        pil_img_with_bboxes = PILImg.fromarray(image_with_bboxes)
+        return input_image, pil_img_with_bboxes
+    except FileNotFoundError as e:
+        logger.error("File not found: %s", e)
+        return None, None
+    except Exception as e:
+        logger.error("An error occurred: %s", e)
+        return None, None
+def load_test_images():
+    """Load images from the test_imgs directory."""
+    test_imgs_dir = os.path.join(os.getcwd(), "test_imgs")
+    logger.info("Loading images from: %s", test_imgs_dir)  # Log the directory path
+    return [f for f in os.listdir(test_imgs_dir) if f.lower().endswith(('.png', '.jpg', '.jpeg'))]
+# Gradio interface
+def create_interface():
+    with gr.Blocks() as demo:
+        # Center the title using HTML
+        gr.Markdown("<h1 style='text-align: center;'>🚪🔍 DHYOLO DoorHandle Object Detection</h1>")
+        # Add paper description with correct hyperlink syntax
+        gr.Markdown("<h2 style='text-align: center;'>📚 iTeach: Interactive Teaching for Robot Perception using Mixed Reality</h2>")
+        # Add the project link using HTML <a> tag
+        gr.Markdown("<h2 style='text-align: center;'>🌐 Project Link: <a href='https://irvlutd.github.io/iTeach/' target='_blank'>iTeach Project</a></h2>")
+        with gr.Row():
+            with gr.Column():
+                # Load a default image for input
+                default_image_path = os.path.join(os.getcwd(), "test_imgs", "irvl-ters.jpg")  # Update with the correct default image name
+                # Attempt to open the default image and log if it fails
+                try:
+                    default_image = PILImg.open(default_image_path)
+                except FileNotFoundError:
+                    logger.error("Default image not found at: %s", default_image_path)
+                    default_image = None  # Set to None or a placeholder image
+                input_image = gr.Image(type="pil", label="Input Image", value=default_image)
+                # Pretrained model paths
+                cwd = os.getcwd()
+                global model_options
+                model_options = {
+                    "dh-yolo-v1-pb-ddf-524": f'{cwd}/pretrained_ckpts/dh-yolo-v1-pb-ddf-524.pt',
+                    "dh-yolo-exp27-pb-1008": f'{cwd}/pretrained_ckpts/dh-yolo-exp27-pb-1008.pt',
+                    "dh-yolo-exp31-pb-1532": f'{cwd}/pretrained_ckpts/dh-yolo-exp-31-pb-1532.pt',
+                    "dh-yolo-exp31-pl-1532": f'{cwd}/pretrained_ckpts/dh-yolo-exp-31-pl-1532.pt'
+                }
+                model_path = gr.Dropdown(choices=list(model_options.keys()), label="Select Pretrained Model", value="dh-yolo-v1-pb-ddf-524")
+                conf = gr.Slider(label="Confidence Threshold", minimum=0.0, maximum=1.0, step=0.01, value=0.5)
+                imu_threshold = gr.Slider(label="IMU Threshold", minimum=0.0, maximum=1.0, step=0.01, value=0.5)
+                detections = gr.Slider(label="Max number of Detections", minimum=1, maximum=100, step=1, value=10)
+            with gr.Column():
+                output_image = gr.Image(label="Output Image with DH-YOLO Detections", type="pil")
+        detect_button = gr.Button("Run")
+        # Detect button functionality
+        detect_button.click(detect_objects, inputs=[model_path, input_image, conf, imu_threshold, detections],
+                            outputs=[input_image, output_image])
+    return demo
+if __name__ == "__main__":
+    demo = create_interface()
+    demo.launch()

pretrained_ckpts/dh-yolo-exp-31-pb-1532.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:625a45abe7ae0e7d52a7528915f45408a93865fc9711e42663a37ce61890e68f
+size 42181652

pretrained_ckpts/dh-yolo-exp-31-pl-1532.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a94b4f8d0f6d965a9de0cf3e22ce3f478bd198eca858e5cce7522393ca07190f
+size 42181652

pretrained_ckpts/dh-yolo-exp27-pb-1008.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a419efeb648285e265195fab71d1e23bc8a95b386f1b10e5bc80abedb26a1859
+size 42181652

pretrained_ckpts/dh-yolo-v1-pb-ddf-524.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0179ed926a58f2c379dda9fbfa15cbca23cefc058554efd9325e4d5f5531e81
+size 42181652

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+gradio
+Pillow
+iteach_toolkit
+opencv-python