Spaces:

Gradio-Blocks
/

ViTPose

Running

App Files Community

hysts HF staff committed on Mar 15, 2023

Commit

5a9bbeb

•

1 Parent(s): 1da2a40

Update

Browse files

Files changed (3) hide show

README.md +1 -1
app.py +126 -162
model.py +12 -9

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 📊
 colorFrom: yellow
 colorTo: indigo
 sdk: gradio
-sdk_version: 3.1.1
 app_file: app.py
 pinned: false
 ---

 colorFrom: yellow
 colorTo: indigo
 sdk: gradio
+sdk_version: 3.21.0
 app_file: app.py
 pinned: false
 ---

app.py CHANGED Viewed

@@ -10,22 +10,7 @@ import gradio as gr
 from model import AppDetModel, AppPoseModel
-DESCRIPTION = '''# ViTPose
-This is an unofficial demo for [https://github.com/ViTAE-Transformer/ViTPose](https://github.com/ViTAE-Transformer/ViTPose).'''
-FOOTER = '<img id="visitor-badge" alt="visitor badge" src="https://visitor-badge.glitch.me/badge?page_id=hysts.vitpose" />'
-def parse_args() -> argparse.Namespace:
-    parser = argparse.ArgumentParser()
-    parser.add_argument('--device', type=str, default='cpu')
-    parser.add_argument('--theme', type=str)
-    parser.add_argument('--share', action='store_true')
-    parser.add_argument('--port', type=int)
-    parser.add_argument('--disable-queue',
-                        dest='enable_queue',
-                        action='store_false')
-    return parser.parse_args()
 def set_example_image(example: list) -> dict:
@@ -39,161 +24,140 @@ def extract_tar() -> None:
         f.extractall('mmdet_configs')
-def main():
-    args = parse_args()
-    extract_tar()
-    det_model = AppDetModel(device=args.device)
-    pose_model = AppPoseModel(device=args.device)
-    with gr.Blocks(theme=args.theme, css='style.css') as demo:
-        gr.Markdown(DESCRIPTION)
-        with gr.Box():
-            gr.Markdown('## Step 1')
-            with gr.Row():
-                with gr.Column():
-                    with gr.Row():
-                        input_image = gr.Image(label='Input Image',
-                                               type='numpy')
-                    with gr.Row():
-                        detector_name = gr.Dropdown(list(
-                            det_model.MODEL_DICT.keys()),
-                                                    value=det_model.model_name,
-                                                    label='Detector')
-                    with gr.Row():
-                        detect_button = gr.Button(value='Detect')
-                        det_preds = gr.Variable()
-                with gr.Column():
-                    with gr.Row():
-                        detection_visualization = gr.Image(
-                            label='Detection Result',
-                            type='numpy',
-                            elem_id='det-result')
-                    with gr.Row():
-                        vis_det_score_threshold = gr.Slider(
-                            0,
-                            1,
-                            step=0.05,
-                            value=0.5,
-                            label='Visualization Score Threshold')
-                    with gr.Row():
-                        redraw_det_button = gr.Button(value='Redraw')
-            with gr.Row():
-                paths = sorted(pathlib.Path('images').rglob('*.jpg'))
-                example_images = gr.Dataset(components=[input_image],
-                                            samples=[[path.as_posix()]
-                                                     for path in paths])
-        with gr.Box():
-            gr.Markdown('## Step 2')
-            with gr.Row():
-                with gr.Column():
-                    with gr.Row():
-                        pose_model_name = gr.Dropdown(
-                            list(pose_model.MODEL_DICT.keys()),
-                            value=pose_model.model_name,
-                            label='Pose Model')
-                    det_score_threshold = gr.Slider(
-                        0,
-                        1,
                         step=0.05,
-                        value=0.5,
-                        label='Box Score Threshold')
-                    with gr.Row():
-                        predict_button = gr.Button(value='Predict')
-                        pose_preds = gr.Variable()
-                with gr.Column():
-                    with gr.Row():
-                        pose_visualization = gr.Image(label='Result',
-                                                      type='numpy',
-                                                      elem_id='pose-result')
-                    with gr.Row():
-                        vis_kpt_score_threshold = gr.Slider(
-                            0,
-                            1,
-                            step=0.05,
-                            value=0.3,
-                            label='Visualization Score Threshold')
-                    with gr.Row():
-                        vis_dot_radius = gr.Slider(1,
-                                                   10,
                                                    step=1,
-                                                   value=4,
-                                                   label='Dot Radius')
-                    with gr.Row():
-                        vis_line_thickness = gr.Slider(1,
-                                                       10,
-                                                       step=1,
-                                                       value=2,
-                                                       label='Line Thickness')
-                    with gr.Row():
-                        redraw_pose_button = gr.Button(value='Redraw')
-        gr.Markdown(FOOTER)
-        detector_name.change(fn=det_model.set_model,
-                             inputs=detector_name,
-                             outputs=None)
-        detect_button.click(fn=det_model.run,
                             inputs=[
-                                detector_name,
                                 input_image,
                                 vis_det_score_threshold,
                             ],
-                            outputs=[
-                                det_preds,
-                                detection_visualization,
-                            ])
-        redraw_det_button.click(fn=det_model.visualize_detection_results,
-                                inputs=[
-                                    input_image,
-                                    det_preds,
-                                    vis_det_score_threshold,
-                                ],
-                                outputs=detection_visualization)
-        pose_model_name.change(fn=pose_model.set_model,
-                               inputs=pose_model_name,
-                               outputs=None)
-        predict_button.click(fn=pose_model.run,
                              inputs=[
-                                 pose_model_name,
                                  input_image,
-                                 det_preds,
-                                 det_score_threshold,
                                  vis_kpt_score_threshold,
                                  vis_dot_radius,
                                  vis_line_thickness,
                              ],
-                             outputs=[
-                                 pose_preds,
-                                 pose_visualization,
-                             ])
-        redraw_pose_button.click(fn=pose_model.visualize_pose_results,
-                                 inputs=[
-                                     input_image,
-                                     pose_preds,
-                                     vis_kpt_score_threshold,
-                                     vis_dot_radius,
-                                     vis_line_thickness,
-                                 ],
-                                 outputs=pose_visualization)
-        example_images.click(
-            fn=set_example_image,
-            inputs=example_images,
-            outputs=input_image,
-        )
-    demo.launch(
-        enable_queue=args.enable_queue,
-        server_port=args.port,
-        share=args.share,
-    )
-if __name__ == '__main__':
-    main()

 from model import AppDetModel, AppPoseModel
+DESCRIPTION = '# [ViTPose](https://github.com/ViTAE-Transformer/ViTPose)'
 def set_example_image(example: list) -> dict:
         f.extractall('mmdet_configs')
+extract_tar()
+det_model = AppDetModel()
+pose_model = AppPoseModel()
+with gr.Blocks(css='style.css') as demo:
+    gr.Markdown(DESCRIPTION)
+    with gr.Box():
+        gr.Markdown('## Step 1')
+        with gr.Row():
+            with gr.Column():
+                with gr.Row():
+                    input_image = gr.Image(label='Input Image', type='numpy')
+                with gr.Row():
+                    detector_name = gr.Dropdown(
+                        label='Detector',
+                        choices=list(det_model.MODEL_DICT.keys()),
+                        value=det_model.model_name)
+                with gr.Row():
+                    detect_button = gr.Button('Detect')
+                    det_preds = gr.Variable()
+            with gr.Column():
+                with gr.Row():
+                    detection_visualization = gr.Image(
+                        label='Detection Result',
+                        type='numpy',
+                        elem_id='det-result')
+                with gr.Row():
+                    vis_det_score_threshold = gr.Slider(
+                        label='Visualization Score Threshold',
+                        minimum=0,
+                        maximum=1,
                         step=0.05,
+                        value=0.5)
+                with gr.Row():
+                    redraw_det_button = gr.Button(value='Redraw')
+        with gr.Row():
+            paths = sorted(pathlib.Path('images').rglob('*.jpg'))
+            example_images = gr.Examples(examples=[[path.as_posix()]
+                                                   for path in paths],
+                                         inputs=input_image)
+    with gr.Box():
+        gr.Markdown('## Step 2')
+        with gr.Row():
+            with gr.Column():
+                with gr.Row():
+                    pose_model_name = gr.Dropdown(
+                        label='Pose Model',
+                        choices=list(pose_model.MODEL_DICT.keys()),
+                        value=pose_model.model_name)
+                det_score_threshold = gr.Slider(label='Box Score Threshold',
+                                                minimum=0,
+                                                maximum=1,
+                                                step=0.05,
+                                                value=0.5)
+                with gr.Row():
+                    predict_button = gr.Button('Predict')
+                    pose_preds = gr.Variable()
+            with gr.Column():
+                with gr.Row():
+                    pose_visualization = gr.Image(label='Result',
+                                                  type='numpy',
+                                                  elem_id='pose-result')
+                with gr.Row():
+                    vis_kpt_score_threshold = gr.Slider(
+                        label='Visualization Score Threshold',
+                        minimum=0,
+                        maximum=1,
+                        step=0.05,
+                        value=0.3)
+                with gr.Row():
+                    vis_dot_radius = gr.Slider(label='Dot Radius',
+                                               minimum=1,
+                                               maximum=10,
+                                               step=1,
+                                               value=4)
+                with gr.Row():
+                    vis_line_thickness = gr.Slider(label='Line Thickness',
+                                                   minimum=1,
+                                                   maximum=10,
                                                    step=1,
+                                                   value=2)
+                with gr.Row():
+                    redraw_pose_button = gr.Button('Redraw')
+    detector_name.change(fn=det_model.set_model,
+                         inputs=detector_name,
+                         outputs=None)
+    detect_button.click(fn=det_model.run,
+                        inputs=[
+                            detector_name,
+                            input_image,
+                            vis_det_score_threshold,
+                        ],
+                        outputs=[
+                            det_preds,
+                            detection_visualization,
+                        ])
+    redraw_det_button.click(fn=det_model.visualize_detection_results,
                             inputs=[
                                 input_image,
+                                det_preds,
                                 vis_det_score_threshold,
                             ],
+                            outputs=detection_visualization)
+    pose_model_name.change(fn=pose_model.set_model,
+                           inputs=pose_model_name,
+                           outputs=None)
+    predict_button.click(fn=pose_model.run,
+                         inputs=[
+                             pose_model_name,
+                             input_image,
+                             det_preds,
+                             det_score_threshold,
+                             vis_kpt_score_threshold,
+                             vis_dot_radius,
+                             vis_line_thickness,
+                         ],
+                         outputs=[
+                             pose_preds,
+                             pose_visualization,
+                         ])
+    redraw_pose_button.click(fn=pose_model.visualize_pose_results,
                              inputs=[
                                  input_image,
+                                 pose_preds,
                                  vis_kpt_score_threshold,
                                  vis_dot_radius,
                                  vis_line_thickness,
                              ],
+                             outputs=pose_visualization)
+demo.queue(api_open=False).launch()

model.py CHANGED Viewed

@@ -2,6 +2,7 @@ from __future__ import annotations
 import os
 import pathlib
 import subprocess
 import sys
@@ -11,9 +12,9 @@ if os.getenv('SYSTEM') == 'spaces':
     mim.uninstall('mmcv-full', confirm_yes=True)
     mim.install('mmcv-full==1.5.0', is_yes=True)
-    subprocess.run('pip uninstall -y opencv-python'.split())
-    subprocess.run('pip uninstall -y opencv-python-headless'.split())
-    subprocess.run('pip install opencv-python-headless==4.5.5.64'.split())
 import huggingface_hub
 import numpy as np
@@ -21,14 +22,14 @@ import torch
 import torch.nn as nn
 app_dir = pathlib.Path(__file__).parent
-submodule_dir = app_dir / 'ViTPose/'
 sys.path.insert(0, submodule_dir.as_posix())
 from mmdet.apis import inference_detector, init_detector
 from mmpose.apis import (inference_top_down_pose_model, init_pose_model,
                          process_mmdet_results, vis_pose_result)
-HF_TOKEN = os.environ['HF_TOKEN']
 class DetModel:
@@ -59,8 +60,9 @@ class DetModel:
         },
     }
-    def __init__(self, device: str | torch.device):
-        self.device = torch.device(device)
         self._load_all_models_once()
         self.model_name = 'YOLOX-l'
         self.model = self._load_model(self.model_name)
@@ -139,8 +141,9 @@ class PoseModel:
         },
     }
-    def __init__(self, device: str | torch.device):
-        self.device = torch.device(device)
         self.model_name = 'ViTPose-B (multi-task train, COCO)'
         self.model = self._load_model(self.model_name)

 import os
 import pathlib
+import shlex
 import subprocess
 import sys
     mim.uninstall('mmcv-full', confirm_yes=True)
     mim.install('mmcv-full==1.5.0', is_yes=True)
+    subprocess.run(shlex.split('pip uninstall -y opencv-python'))
+    subprocess.run(shlex.split('pip uninstall -y opencv-python-headless'))
+    subprocess.run(shlex.split('pip install opencv-python-headless==4.5.5.64'))
 import huggingface_hub
 import numpy as np
 import torch.nn as nn
 app_dir = pathlib.Path(__file__).parent
+submodule_dir = app_dir / 'ViTPose'
 sys.path.insert(0, submodule_dir.as_posix())
 from mmdet.apis import inference_detector, init_detector
 from mmpose.apis import (inference_top_down_pose_model, init_pose_model,
                          process_mmdet_results, vis_pose_result)
+HF_TOKEN = os.getenv('HF_TOKEN')
 class DetModel:
         },
     }
+    def __init__(self):
+        self.device = torch.device(
+            'cuda:0' if torch.cuda.is_available() else 'cpu')
         self._load_all_models_once()
         self.model_name = 'YOLOX-l'
         self.model = self._load_model(self.model_name)
         },
     }
+    def __init__(self):
+        self.device = torch.device(
+            'cuda:0' if torch.cuda.is_available() else 'cpu')
         self.model_name = 'ViTPose-B (multi-task train, COCO)'
         self.model = self._load_model(self.model_name)