hysts (HF staff) committed on
Commit f521e88
1 Parent(s): 89efab8

Migrate from yapf to black
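
The change is mechanical: yapf (and the `double-quote-string-fixer` hook and `.style.yapf` config that enforced its single-quote style) is dropped, black with a 119-character line length takes over formatting, and isort is switched to its black-compatible profile. As a minimal before/after sketch of what the reformatting does, taken from the app_canny.py diff below — yapf's paren-aligned, single-quoted style:

    num_samples = gr.Slider(label='Number of images',
                            minimum=1,
                            maximum=MAX_NUM_IMAGES,
                            value=DEFAULT_NUM_IMAGES,
                            step=1)

becomes black's double-quoted, hanging-indent style:

    num_samples = gr.Slider(
        label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
    )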

.pre-commit-config.yaml CHANGED
@@ -1,36 +1,55 @@
 repos:
-  - repo: https://github.com/pre-commit/pre-commit-hooks
-    rev: v4.2.0
-    hooks:
-      - id: check-executables-have-shebangs
-      - id: check-json
-      - id: check-merge-conflict
-      - id: check-shebang-scripts-are-executable
-      - id: check-toml
-      - id: check-yaml
-      - id: double-quote-string-fixer
-      - id: end-of-file-fixer
-      - id: mixed-line-ending
-        args: ['--fix=lf']
-      - id: requirements-txt-fixer
-      - id: trailing-whitespace
-  - repo: https://github.com/myint/docformatter
-    rev: v1.4
-    hooks:
-      - id: docformatter
-        args: ['--in-place']
-  - repo: https://github.com/pycqa/isort
-    rev: 5.12.0
-    hooks:
-      - id: isort
-  - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: v0.991
-    hooks:
-      - id: mypy
-        args: ['--ignore-missing-imports']
-        additional_dependencies: ['types-python-slugify']
-  - repo: https://github.com/google/yapf
-    rev: v0.32.0
-    hooks:
-      - id: yapf
-        args: ['--parallel', '--in-place']
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v4.4.0
+    hooks:
+      - id: check-executables-have-shebangs
+      - id: check-json
+      - id: check-merge-conflict
+      - id: check-shebang-scripts-are-executable
+      - id: check-toml
+      - id: check-yaml
+      - id: end-of-file-fixer
+      - id: mixed-line-ending
+        args: ["--fix=lf"]
+      - id: requirements-txt-fixer
+      - id: trailing-whitespace
+  - repo: https://github.com/myint/docformatter
+    rev: v1.7.5
+    hooks:
+      - id: docformatter
+        args: ["--in-place"]
+  - repo: https://github.com/pycqa/isort
+    rev: 5.12.0
+    hooks:
+      - id: isort
+        args: ["--profile", "black"]
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.5.1
+    hooks:
+      - id: mypy
+        args: ["--ignore-missing-imports"]
+        additional_dependencies:
+          ["types-python-slugify", "types-requests", "types-PyYAML"]
+  - repo: https://github.com/psf/black
+    rev: 23.9.1
+    hooks:
+      - id: black
+        language_version: python3.10
+        args: ["--line-length", "119"]
+  - repo: https://github.com/kynan/nbstripout
+    rev: 0.6.1
+    hooks:
+      - id: nbstripout
+        args:
+          [
+            "--extra-keys",
+            "metadata.interpreter metadata.kernelspec cell.metadata.pycharm",
+          ]
+  - repo: https://github.com/nbQA-dev/nbQA
+    rev: 1.7.0
+    hooks:
+      - id: nbqa-black
+      - id: nbqa-pyupgrade
+        args: ["--py37-plus"]
+      - id: nbqa-isort
+        args: ["--float-to-top"]
.style.yapf DELETED
@@ -1,5 +0,0 @@
-[style]
-based_on_style = pep8
-blank_line_before_nested_class_or_def = false
-spaces_before_comment = 2
-split_before_logical_operator = true
.vscode/settings.json CHANGED
@@ -1,18 +1,21 @@
 {
-    "python.linting.enabled": true,
-    "python.linting.flake8Enabled": true,
-    "python.linting.pylintEnabled": false,
-    "python.linting.lintOnSave": true,
-    "python.formatting.provider": "yapf",
-    "python.formatting.yapfArgs": [
-        "--style={based_on_style: pep8, indent_width: 4, blank_line_before_nested_class_or_def: false, spaces_before_comment: 2, split_before_logical_operator: true}"
-    ],
     "[python]": {
+        "editor.defaultFormatter": "ms-python.black-formatter",
         "editor.formatOnType": true,
         "editor.codeActionsOnSave": {
             "source.organizeImports": true
         }
     },
+    "black-formatter.args": [
+        "--line-length=119"
+    ],
+    "isort.args": ["--profile", "black"],
+    "flake8.args": [
+        "--max-line-length=119"
+    ],
+    "ruff.args": [
+        "--line-length=119"
+    ],
     "editor.formatOnSave": true,
     "files.insertFinalNewline": true
 }
app.py CHANGED
@@ -13,83 +13,79 @@ from app_mlsd import create_demo as create_demo_mlsd
 from app_normal import create_demo as create_demo_normal
 from app_openpose import create_demo as create_demo_openpose
 from app_scribble import create_demo as create_demo_scribble
-from app_scribble_interactive import \
-    create_demo as create_demo_scribble_interactive
+from app_scribble_interactive import create_demo as create_demo_scribble_interactive
 from app_segmentation import create_demo as create_demo_segmentation
 from app_shuffle import create_demo as create_demo_shuffle
 from app_softedge import create_demo as create_demo_softedge
 from model import Model
-from settings import (ALLOW_CHANGING_BASE_MODEL, DEFAULT_MODEL_ID,
-                      SHOW_DUPLICATE_BUTTON)
+from settings import ALLOW_CHANGING_BASE_MODEL, DEFAULT_MODEL_ID, SHOW_DUPLICATE_BUTTON
 
-DESCRIPTION = '# ControlNet v1.1'
+DESCRIPTION = "# ControlNet v1.1"
 
 if not torch.cuda.is_available():
-    DESCRIPTION += '\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>'
+    DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
 
-model = Model(base_model_id=DEFAULT_MODEL_ID, task_name='Canny')
+model = Model(base_model_id=DEFAULT_MODEL_ID, task_name="Canny")
 
-with gr.Blocks(css='style.css') as demo:
+with gr.Blocks(css="style.css") as demo:
     gr.Markdown(DESCRIPTION)
-    gr.DuplicateButton(value='Duplicate Space for private use',
-                       elem_id='duplicate-button',
-                       visible=SHOW_DUPLICATE_BUTTON)
+    gr.DuplicateButton(
+        value="Duplicate Space for private use", elem_id="duplicate-button", visible=SHOW_DUPLICATE_BUTTON
+    )
 
     with gr.Tabs():
-        with gr.TabItem('Canny'):
+        with gr.TabItem("Canny"):
            create_demo_canny(model.process_canny)
-        with gr.TabItem('MLSD'):
+        with gr.TabItem("MLSD"):
            create_demo_mlsd(model.process_mlsd)
-        with gr.TabItem('Scribble'):
+        with gr.TabItem("Scribble"):
            create_demo_scribble(model.process_scribble)
-        with gr.TabItem('Scribble Interactive'):
-            create_demo_scribble_interactive(
-                model.process_scribble_interactive)
-        with gr.TabItem('SoftEdge'):
+        with gr.TabItem("Scribble Interactive"):
+            create_demo_scribble_interactive(model.process_scribble_interactive)
+        with gr.TabItem("SoftEdge"):
            create_demo_softedge(model.process_softedge)
-        with gr.TabItem('OpenPose'):
+        with gr.TabItem("OpenPose"):
            create_demo_openpose(model.process_openpose)
-        with gr.TabItem('Segmentation'):
+        with gr.TabItem("Segmentation"):
            create_demo_segmentation(model.process_segmentation)
-        with gr.TabItem('Depth'):
+        with gr.TabItem("Depth"):
            create_demo_depth(model.process_depth)
-        with gr.TabItem('Normal map'):
+        with gr.TabItem("Normal map"):
            create_demo_normal(model.process_normal)
-        with gr.TabItem('Lineart'):
+        with gr.TabItem("Lineart"):
            create_demo_lineart(model.process_lineart)
-        with gr.TabItem('Content Shuffle'):
+        with gr.TabItem("Content Shuffle"):
            create_demo_shuffle(model.process_shuffle)
-        with gr.TabItem('Instruct Pix2Pix'):
+        with gr.TabItem("Instruct Pix2Pix"):
            create_demo_ip2p(model.process_ip2p)
 
-    with gr.Accordion(label='Base model', open=False):
+    with gr.Accordion(label="Base model", open=False):
         with gr.Row():
             with gr.Column(scale=5):
-                current_base_model = gr.Text(label='Current base model')
+                current_base_model = gr.Text(label="Current base model")
             with gr.Column(scale=1):
-                check_base_model_button = gr.Button('Check current base model')
+                check_base_model_button = gr.Button("Check current base model")
         with gr.Row():
             with gr.Column(scale=5):
                 new_base_model_id = gr.Text(
-                    label='New base model',
+                    label="New base model",
                     max_lines=1,
-                    placeholder='runwayml/stable-diffusion-v1-5',
-                    info=
-                    'The base model must be compatible with Stable Diffusion v1.5.',
-                    interactive=ALLOW_CHANGING_BASE_MODEL)
+                    placeholder="runwayml/stable-diffusion-v1-5",
+                    info="The base model must be compatible with Stable Diffusion v1.5.",
+                    interactive=ALLOW_CHANGING_BASE_MODEL,
+                )
             with gr.Column(scale=1):
-                change_base_model_button = gr.Button(
-                    'Change base model', interactive=ALLOW_CHANGING_BASE_MODEL)
+                change_base_model_button = gr.Button("Change base model", interactive=ALLOW_CHANGING_BASE_MODEL)
         if not ALLOW_CHANGING_BASE_MODEL:
             gr.Markdown(
-                '''The base model is not allowed to be changed in this Space so as not to slow down the demo, but it can be changed if you duplicate the Space.'''
+                """The base model is not allowed to be changed in this Space so as not to slow down the demo, but it can be changed if you duplicate the Space."""
             )
 
     check_base_model_button.click(
         fn=lambda: model.base_model_id,
         outputs=current_base_model,
         queue=False,
-        api_name='check_base_model',
+        api_name="check_base_model",
     )
     new_base_model_id.submit(
         fn=model.set_base_model,
app_canny.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,62 +17,36 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 canny_low_threshold = gr.Slider(
-                    label='Canny low threshold',
-                    minimum=1,
-                    maximum=255,
-                    value=100,
-                    step=1)
+                    label="Canny low threshold", minimum=1, maximum=255, value=100, step=1
+                )
                 canny_high_threshold = gr.Slider(
-                    label='Canny high threshold',
-                    minimum=1,
-                    maximum=255,
-                    value=200,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Canny high threshold", minimum=1, maximum=255, value=200, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -103,13 +82,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='canny',
+        api_name="canny",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='Canny')
+
+    model = Model(task_name="Canny")
     demo = create_demo(model.process_canny)
     demo.queue().launch()
app_depth.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,61 +17,36 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
                 preprocessor_name = gr.Radio(
-                    label='Preprocessor',
-                    choices=['Midas', 'DPT', 'None'],
-                    type='value',
-                    value='DPT')
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+                    label="Preprocessor", choices=["Midas", "DPT", "None"], type="value", value="DPT"
+                )
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=384,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Preprocess resolution", minimum=128, maximum=512, value=384, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -102,13 +82,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='depth',
+        api_name="depth",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='depth')
+
+    model = Model(task_name="depth")
     demo = create_demo(model.process_depth)
     demo.queue().launch()
app_ip2p.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,50 +17,30 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    step=256,
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -89,13 +74,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='ip2p',
+        api_name="ip2p",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='ip2p')
+
+    model = Model(task_name="ip2p")
     demo = create_demo(model.process_ip2p)
     demo.queue().launch()
app_lineart.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,70 +17,46 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
                 preprocessor_name = gr.Radio(
-                    label='Preprocessor',
+                    label="Preprocessor",
                     choices=[
-                        'Lineart',
-                        'Lineart coarse',
-                        'None',
-                        'Lineart (anime)',
-                        'None (anime)',
+                        "Lineart",
+                        "Lineart coarse",
+                        "None",
+                        "Lineart (anime)",
+                        "None (anime)",
                     ],
-                    type='value',
-                    value='Lineart',
-                    info=
-                    'Note that "Lineart (anime)" and "None (anime)" are for anime base models like Anything-v3.'
+                    type="value",
+                    value="Lineart",
+                    info='Note that "Lineart (anime)" and "None (anime)" are for anime base models like Anything-v3.',
+                )
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
                 )
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=512,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Preprocess resolution", minimum=128, maximum=512, value=512, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -111,13 +92,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='lineart',
+        api_name="lineart",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='lineart')
+
+    model = Model(task_name="lineart")
     demo = create_demo(model.process_lineart)
     demo.queue().launch()
app_mlsd.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,68 +17,39 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=512,
-                    step=1)
+                    label="Preprocess resolution", minimum=128, maximum=512, value=512, step=1
+                )
                 mlsd_value_threshold = gr.Slider(
-                    label='Hough value threshold (MLSD)',
-                    minimum=0.01,
-                    maximum=2.0,
-                    value=0.1,
-                    step=0.01)
+                    label="Hough value threshold (MLSD)", minimum=0.01, maximum=2.0, value=0.1, step=0.01
+                )
                 mlsd_distance_threshold = gr.Slider(
-                    label='Hough distance threshold (MLSD)',
-                    minimum=0.01,
-                    maximum=20.0,
-                    value=0.1,
-                    step=0.01)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Hough distance threshold (MLSD)", minimum=0.01, maximum=20.0, value=0.1, step=0.01
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -110,13 +86,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='mlsd',
+        api_name="mlsd",
    )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='MLSD')
+
+    model = Model(task_name="MLSD")
     demo = create_demo(model.process_mlsd)
     demo.queue().launch()
app_normal.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,60 +17,36 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
-                preprocessor_name = gr.Radio(label='Preprocessor',
-                                             choices=['NormalBae', 'None'],
-                                             type='value',
-                                             value='NormalBae')
-                num_samples = gr.Slider(label='Images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
+                preprocessor_name = gr.Radio(
+                    label="Preprocessor", choices=["NormalBae", "None"], type="value", value="NormalBae"
+                )
+                num_samples = gr.Slider(
+                    label="Images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=384,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Preprocess resolution", minimum=128, maximum=512, value=384, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -101,13 +82,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='normal',
+        api_name="normal",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='NormalBae')
+
+    model = Model(task_name="NormalBae")
     demo = create_demo(model.process_normal)
     demo.queue().launch()
app_openpose.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,60 +17,36 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button(label='Run')
-            with gr.Accordion('Advanced options', open=False):
-                preprocessor_name = gr.Radio(label='Preprocessor',
-                                             choices=['Openpose', 'None'],
-                                             type='value',
-                                             value='Openpose')
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button(label="Run")
+            with gr.Accordion("Advanced options", open=False):
+                preprocessor_name = gr.Radio(
+                    label="Preprocessor", choices=["Openpose", "None"], type="value", value="Openpose"
+                )
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=512,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Preprocess resolution", minimum=128, maximum=512, value=512, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -101,13 +82,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='openpose',
+        api_name="openpose",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='Openpose')
+
+    model = Model(task_name="Openpose")
     demo = create_demo(model.process_openpose)
     demo.queue().launch()
app_scribble.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,61 +17,36 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
                 preprocessor_name = gr.Radio(
-                    label='Preprocessor',
-                    choices=['HED', 'PidiNet', 'None'],
-                    type='value',
-                    value='HED')
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+                    label="Preprocessor", choices=["HED", "PidiNet", "None"], type="value", value="HED"
+                )
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=512,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Preprocess resolution", minimum=128, maximum=512, value=512, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -102,13 +82,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='scribble',
+        api_name="scribble",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='scribble')
+
+    model = Model(task_name="scribble")
     demo = create_demo(model.process_scribble)
     demo.queue().launch()
app_scribble_interactive.py CHANGED
@@ -3,8 +3,13 @@
 import gradio as gr
 import numpy as np
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -16,62 +21,46 @@ def create_demo(process):
     with gr.Blocks() as demo:
         with gr.Row():
             with gr.Column():
-                canvas_width = gr.Slider(label='Canvas width',
-                                         minimum=256,
-                                         maximum=MAX_IMAGE_RESOLUTION,
-                                         value=DEFAULT_IMAGE_RESOLUTION,
-                                         step=1)
-                canvas_height = gr.Slider(label='Canvas height',
-                                          minimum=256,
-                                          maximum=MAX_IMAGE_RESOLUTION,
-                                          value=DEFAULT_IMAGE_RESOLUTION,
-                                          step=1)
-                create_button = gr.Button('Open drawing canvas!')
-                image = gr.Image(tool='sketch', brush_radius=10)
-                prompt = gr.Textbox(label='Prompt')
-                run_button = gr.Button('Run')
-                with gr.Accordion('Advanced options', open=False):
-                    num_samples = gr.Slider(label='Number of images',
-                                            minimum=1,
-                                            maximum=MAX_NUM_IMAGES,
-                                            value=DEFAULT_NUM_IMAGES,
-                                            step=1)
+                canvas_width = gr.Slider(
+                    label="Canvas width",
+                    minimum=256,
+                    maximum=MAX_IMAGE_RESOLUTION,
+                    value=DEFAULT_IMAGE_RESOLUTION,
+                    step=1,
+                )
+                canvas_height = gr.Slider(
+                    label="Canvas height",
+                    minimum=256,
+                    maximum=MAX_IMAGE_RESOLUTION,
+                    value=DEFAULT_IMAGE_RESOLUTION,
+                    step=1,
+                )
+                create_button = gr.Button("Open drawing canvas!")
+                image = gr.Image(tool="sketch", brush_radius=10)
+                prompt = gr.Textbox(label="Prompt")
+                run_button = gr.Button("Run")
+                with gr.Accordion("Advanced options", open=False):
+                    num_samples = gr.Slider(
+                        label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                    )
                     image_resolution = gr.Slider(
-                        label='Image resolution',
+                        label="Image resolution",
                         minimum=256,
                         maximum=MAX_IMAGE_RESOLUTION,
                         value=DEFAULT_IMAGE_RESOLUTION,
-                        step=256)
-                    num_steps = gr.Slider(label='Number of steps',
-                                          minimum=1,
-                                          maximum=100,
-                                          value=20,
-                                          step=1)
-                    guidance_scale = gr.Slider(label='Guidance scale',
-                                               minimum=0.1,
-                                               maximum=30.0,
-                                               value=9.0,
-                                               step=0.1)
-                    seed = gr.Slider(label='Seed',
-                                     minimum=0,
-                                     maximum=MAX_SEED,
-                                     step=1,
-                                     value=0)
-                    randomize_seed = gr.Checkbox(label='Randomize seed',
-                                                 value=True)
-                    a_prompt = gr.Textbox(
-                        label='Additional prompt',
-                        value='best quality, extremely detailed')
+                        step=256,
+                    )
+                    num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                    guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                    seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                    randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                    a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                     n_prompt = gr.Textbox(
-                        label='Negative prompt',
-                        value=
-                        'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                        label="Negative prompt",
+                        value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                     )
             with gr.Column():
-                result = gr.Gallery(label='Output',
-                                    show_label=False,
-                                    columns=2,
-                                    object_fit='scale-down')
+                result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
 
         create_button.click(
             fn=create_canvas,
@@ -118,8 +107,9 @@ def create_demo(process):
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='scribble')
+
+    model = Model(task_name="scribble")
     demo = create_demo(model.process_scribble_interactive)
     demo.queue().launch()
app_segmentation.py CHANGED
@@ -2,8 +2,13 @@
 
 import gradio as gr
 
-from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                      MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
+from settings import (
+    DEFAULT_IMAGE_RESOLUTION,
+    DEFAULT_NUM_IMAGES,
+    MAX_IMAGE_RESOLUTION,
+    MAX_NUM_IMAGES,
+    MAX_SEED,
+)
 from utils import randomize_seed_fn
 
 
@@ -12,60 +17,36 @@ def create_demo(process):
     with gr.Row():
         with gr.Column():
             image = gr.Image()
-            prompt = gr.Textbox(label='Prompt')
-            run_button = gr.Button('Run')
-            with gr.Accordion('Advanced options', open=False):
-                preprocessor_name = gr.Radio(label='Preprocessor',
-                                             choices=['UPerNet', 'None'],
-                                             type='value',
-                                             value='UPerNet')
-                num_samples = gr.Slider(label='Number of images',
-                                        minimum=1,
-                                        maximum=MAX_NUM_IMAGES,
-                                        value=DEFAULT_NUM_IMAGES,
-                                        step=1)
+            prompt = gr.Textbox(label="Prompt")
+            run_button = gr.Button("Run")
+            with gr.Accordion("Advanced options", open=False):
+                preprocessor_name = gr.Radio(
+                    label="Preprocessor", choices=["UPerNet", "None"], type="value", value="UPerNet"
+                )
+                num_samples = gr.Slider(
+                    label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                )
                 image_resolution = gr.Slider(
-                    label='Image resolution',
+                    label="Image resolution",
                     minimum=256,
                     maximum=MAX_IMAGE_RESOLUTION,
                     value=DEFAULT_IMAGE_RESOLUTION,
-                    step=256)
+                    step=256,
+                )
                 preprocess_resolution = gr.Slider(
-                    label='Preprocess resolution',
-                    minimum=128,
-                    maximum=512,
-                    value=512,
-                    step=1)
-                num_steps = gr.Slider(label='Number of steps',
-                                      minimum=1,
-                                      maximum=100,
-                                      value=20,
-                                      step=1)
-                guidance_scale = gr.Slider(label='Guidance scale',
-                                           minimum=0.1,
-                                           maximum=30.0,
-                                           value=9.0,
-                                           step=0.1)
-                seed = gr.Slider(label='Seed',
-                                 minimum=0,
-                                 maximum=MAX_SEED,
-                                 step=1,
-                                 value=0)
-                randomize_seed = gr.Checkbox(label='Randomize seed',
-                                             value=True)
-                a_prompt = gr.Textbox(
-                    label='Additional prompt',
-                    value='best quality, extremely detailed')
+                    label="Preprocess resolution", minimum=128, maximum=512, value=512, step=1
+                )
+                num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                 n_prompt = gr.Textbox(
-                    label='Negative prompt',
-                    value=
-                    'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
+                    label="Negative prompt",
+                    value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                 )
         with gr.Column():
-            result = gr.Gallery(label='Output',
-                                show_label=False,
-                                columns=2,
-                                object_fit='scale-down')
+            result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
     inputs = [
         image,
         prompt,
@@ -101,13 +82,14 @@ def create_demo(process):
         fn=process,
         inputs=inputs,
         outputs=result,
-        api_name='segmentation',
+        api_name="segmentation",
     )
     return demo
 
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     from model import Model
-    model = Model(task_name='segmentation')
+
+    model = Model(task_name="segmentation")
     demo = create_demo(model.process_segmentation)
     demo.queue().launch()
app_shuffle.py CHANGED
@@ -2,8 +2,13 @@

  import gradio as gr

- from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                       MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
  from utils import randomize_seed_fn


@@ -12,55 +17,33 @@ def create_demo(process):
          with gr.Row():
              with gr.Column():
                  image = gr.Image()
-                 prompt = gr.Textbox(label='Prompt')
-                 run_button = gr.Button('Run')
-                 with gr.Accordion('Advanced options', open=False):
                      preprocessor_name = gr.Radio(
-                         label='Preprocessor',
-                         choices=['ContentShuffle', 'None'],
-                         type='value',
-                         value='ContentShuffle')
-                     num_samples = gr.Slider(label='Number of images',
-                                             minimum=1,
-                                             maximum=MAX_NUM_IMAGES,
-                                             value=DEFAULT_NUM_IMAGES,
-                                             step=1)
                      image_resolution = gr.Slider(
-                         label='Image resolution',
                          minimum=256,
                          maximum=MAX_IMAGE_RESOLUTION,
                          value=DEFAULT_IMAGE_RESOLUTION,
-                         step=256)
-                     num_steps = gr.Slider(label='Number of steps',
-                                           minimum=1,
-                                           maximum=100,
-                                           value=20,
-                                           step=1)
-                     guidance_scale = gr.Slider(label='Guidance scale',
-                                                minimum=0.1,
-                                                maximum=30.0,
-                                                value=9.0,
-                                                step=0.1)
-                     seed = gr.Slider(label='Seed',
-                                      minimum=0,
-                                      maximum=MAX_SEED,
-                                      step=1,
-                                      value=0)
-                     randomize_seed = gr.Checkbox(label='Randomize seed',
-                                                  value=True)
-                     a_prompt = gr.Textbox(
-                         label='Additional prompt',
-                         value='best quality, extremely detailed')
                      n_prompt = gr.Textbox(
-                         label='Negative prompt',
-                         value=
-                         'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
                      )
              with gr.Column():
-                 result = gr.Gallery(label='Output',
-                                     show_label=False,
-                                     columns=2,
-                                     object_fit='scale-down')
          inputs = [
              image,
              prompt,
@@ -95,13 +78,14 @@ def create_demo(process):
              fn=process,
              inputs=inputs,
              outputs=result,
-             api_name='content-shuffle',
          )
          return demo


- if __name__ == '__main__':
      from model import Model
-     model = Model(task_name='shuffle')
      demo = create_demo(model.process_shuffle)
      demo.queue().launch()


  import gradio as gr

+ from settings import (
+     DEFAULT_IMAGE_RESOLUTION,
+     DEFAULT_NUM_IMAGES,
+     MAX_IMAGE_RESOLUTION,
+     MAX_NUM_IMAGES,
+     MAX_SEED,
+ )
  from utils import randomize_seed_fn


          with gr.Row():
              with gr.Column():
                  image = gr.Image()
+                 prompt = gr.Textbox(label="Prompt")
+                 run_button = gr.Button("Run")
+                 with gr.Accordion("Advanced options", open=False):
                      preprocessor_name = gr.Radio(
+                         label="Preprocessor", choices=["ContentShuffle", "None"], type="value", value="ContentShuffle"
+                     )
+                     num_samples = gr.Slider(
+                         label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                     )
                      image_resolution = gr.Slider(
+                         label="Image resolution",
                          minimum=256,
                          maximum=MAX_IMAGE_RESOLUTION,
                          value=DEFAULT_IMAGE_RESOLUTION,
+                         step=256,
+                     )
+                     num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                     guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                     seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                     randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                     a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                      n_prompt = gr.Textbox(
+                         label="Negative prompt",
+                         value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                      )
              with gr.Column():
+                 result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
          inputs = [
              image,
              prompt,

              fn=process,
              inputs=inputs,
              outputs=result,
+             api_name="content-shuffle",
          )
          return demo


+ if __name__ == "__main__":
      from model import Model
+
+     model = Model(task_name="shuffle")
      demo = create_demo(model.process_shuffle)
      demo.queue().launch()
app_softedge.py CHANGED
@@ -2,8 +2,13 @@

  import gradio as gr

- from settings import (DEFAULT_IMAGE_RESOLUTION, DEFAULT_NUM_IMAGES,
-                       MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES, MAX_SEED)
  from utils import randomize_seed_fn


@@ -12,66 +17,45 @@ def create_demo(process):
          with gr.Row():
              with gr.Column():
                  image = gr.Image()
-                 prompt = gr.Textbox(label='Prompt')
-                 run_button = gr.Button('Run')
-                 with gr.Accordion('Advanced options', open=False):
-                     preprocessor_name = gr.Radio(label='Preprocessor',
-                                                  choices=[
-                                                      'HED',
-                                                      'PidiNet',
-                                                      'HED safe',
-                                                      'PidiNet safe',
-                                                      'None',
-                                                  ],
-                                                  type='value',
-                                                  value='PidiNet')
-                     num_samples = gr.Slider(label='Number of images',
-                                             minimum=1,
-                                             maximum=MAX_NUM_IMAGES,
-                                             value=DEFAULT_NUM_IMAGES,
-                                             step=1)
                      image_resolution = gr.Slider(
-                         label='Image resolution',
                          minimum=256,
                          maximum=MAX_IMAGE_RESOLUTION,
                          value=DEFAULT_IMAGE_RESOLUTION,
-                         step=256)
                      preprocess_resolution = gr.Slider(
-                         label='Preprocess resolution',
-                         minimum=128,
-                         maximum=512,
-                         value=512,
-                         step=1)
-                     num_steps = gr.Slider(label='Number of steps',
-                                           minimum=1,
-                                           maximum=100,
-                                           value=20,
-                                           step=1)
-                     guidance_scale = gr.Slider(label='Guidance scale',
-                                                minimum=0.1,
-                                                maximum=30.0,
-                                                value=9.0,
-                                                step=0.1)
-                     seed = gr.Slider(label='Seed',
-                                      minimum=0,
-                                      maximum=MAX_SEED,
-                                      step=1,
-                                      value=0)
-                     randomize_seed = gr.Checkbox(label='Randomize seed',
-                                                  value=True)
-                     a_prompt = gr.Textbox(
-                         label='Additional prompt',
-                         value='best quality, extremely detailed')
                      n_prompt = gr.Textbox(
-                         label='Negative prompt',
-                         value=
-                         'longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality'
                      )
              with gr.Column():
-                 result = gr.Gallery(label='Output',
-                                     show_label=False,
-                                     columns=2,
-                                     object_fit='scale-down')
          inputs = [
              image,
              prompt,
@@ -107,13 +91,14 @@ def create_demo(process):
              fn=process,
              inputs=inputs,
              outputs=result,
-             api_name='softedge',
          )
          return demo


- if __name__ == '__main__':
      from model import Model
-     model = Model(task_name='softedge')
      demo = create_demo(model.process_softedge)
      demo.queue().launch()


  import gradio as gr

+ from settings import (
+     DEFAULT_IMAGE_RESOLUTION,
+     DEFAULT_NUM_IMAGES,
+     MAX_IMAGE_RESOLUTION,
+     MAX_NUM_IMAGES,
+     MAX_SEED,
+ )
  from utils import randomize_seed_fn


          with gr.Row():
              with gr.Column():
                  image = gr.Image()
+                 prompt = gr.Textbox(label="Prompt")
+                 run_button = gr.Button("Run")
+                 with gr.Accordion("Advanced options", open=False):
+                     preprocessor_name = gr.Radio(
+                         label="Preprocessor",
+                         choices=[
+                             "HED",
+                             "PidiNet",
+                             "HED safe",
+                             "PidiNet safe",
+                             "None",
+                         ],
+                         type="value",
+                         value="PidiNet",
+                     )
+                     num_samples = gr.Slider(
+                         label="Number of images", minimum=1, maximum=MAX_NUM_IMAGES, value=DEFAULT_NUM_IMAGES, step=1
+                     )
                      image_resolution = gr.Slider(
+                         label="Image resolution",
                          minimum=256,
                          maximum=MAX_IMAGE_RESOLUTION,
                          value=DEFAULT_IMAGE_RESOLUTION,
+                         step=256,
+                     )
                      preprocess_resolution = gr.Slider(
+                         label="Preprocess resolution", minimum=128, maximum=512, value=512, step=1
+                     )
+                     num_steps = gr.Slider(label="Number of steps", minimum=1, maximum=100, value=20, step=1)
+                     guidance_scale = gr.Slider(label="Guidance scale", minimum=0.1, maximum=30.0, value=9.0, step=0.1)
+                     seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+                     randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                     a_prompt = gr.Textbox(label="Additional prompt", value="best quality, extremely detailed")
                      n_prompt = gr.Textbox(
+                         label="Negative prompt",
+                         value="longbody, lowres, bad anatomy, bad hands, missing fingers, extra digit, fewer digits, cropped, worst quality, low quality",
                      )
              with gr.Column():
+                 result = gr.Gallery(label="Output", show_label=False, columns=2, object_fit="scale-down")
          inputs = [
              image,
              prompt,

              fn=process,
              inputs=inputs,
              outputs=result,
+             api_name="softedge",
          )
          return demo


+ if __name__ == "__main__":
      from model import Model
+
+     model = Model(task_name="softedge")
      demo = create_demo(model.process_softedge)
      demo.queue().launch()
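Note that the "HED safe" and "PidiNet safe" Radio choices above are not separate preprocessors; model.process_softedge (further down in this diff) derives a flag from the selected string, roughly:

    preprocessor_name = "PidiNet safe"  # illustrative value from the Radio above
    safe = "safe" in preprocessor_name  # True; forwarded to the PidiNet preprocessor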
depth_estimator.py CHANGED
@@ -8,17 +8,17 @@ from cv_utils import resize_image


  class DepthEstimator:
      def __init__(self):
-         self.model = pipeline('depth-estimation')

      def __call__(self, image: np.ndarray, **kwargs) -> PIL.Image.Image:
-         detect_resolution = kwargs.pop('detect_resolution', 512)
-         image_resolution = kwargs.pop('image_resolution', 512)
          image = np.array(image)
          image = HWC3(image)
          image = resize_image(image, resolution=detect_resolution)
          image = PIL.Image.fromarray(image)
          image = self.model(image)
-         image = image['depth']
          image = np.array(image)
          image = HWC3(image)
          image = resize_image(image, resolution=image_resolution)


  class DepthEstimator:
      def __init__(self):
+         self.model = pipeline("depth-estimation")

      def __call__(self, image: np.ndarray, **kwargs) -> PIL.Image.Image:
+         detect_resolution = kwargs.pop("detect_resolution", 512)
+         image_resolution = kwargs.pop("image_resolution", 512)
          image = np.array(image)
          image = HWC3(image)
          image = resize_image(image, resolution=detect_resolution)
          image = PIL.Image.fromarray(image)
          image = self.model(image)
+         image = image["depth"]
          image = np.array(image)
          image = HWC3(image)
          image = resize_image(image, resolution=image_resolution)
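For context, DepthEstimator wraps a transformers depth-estimation pipeline and takes the two resolution keywords popped above; per its return annotation it produces a PIL image. A minimal usage sketch (the file paths are hypothetical):

    import numpy as np
    import PIL.Image

    from depth_estimator import DepthEstimator

    estimator = DepthEstimator()
    image = np.array(PIL.Image.open("input.png"))  # hypothetical input image
    depth = estimator(image, detect_resolution=512, image_resolution=512)
    depth.save("depth.png")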
image_segmentor.py CHANGED
@@ -10,30 +10,24 @@ from cv_utils import resize_image


  class ImageSegmentor:
      def __init__(self):
-         self.image_processor = AutoImageProcessor.from_pretrained(
-             'openmmlab/upernet-convnext-small')
-         self.image_segmentor = UperNetForSemanticSegmentation.from_pretrained(
-             'openmmlab/upernet-convnext-small')

      @torch.inference_mode()
      def __call__(self, image: np.ndarray, **kwargs) -> PIL.Image.Image:
-         detect_resolution = kwargs.pop('detect_resolution', 512)
-         image_resolution = kwargs.pop('image_resolution', 512)
          image = HWC3(image)
          image = resize_image(image, resolution=detect_resolution)
          image = PIL.Image.fromarray(image)

-         pixel_values = self.image_processor(image,
-                                             return_tensors='pt').pixel_values
          outputs = self.image_segmentor(pixel_values)
-         seg = self.image_processor.post_process_semantic_segmentation(
-             outputs, target_sizes=[image.size[::-1]])[0]
          color_seg = np.zeros((seg.shape[0], seg.shape[1], 3), dtype=np.uint8)
          for label, color in enumerate(ade_palette()):
              color_seg[seg == label, :] = color
          color_seg = color_seg.astype(np.uint8)

-         color_seg = resize_image(color_seg,
-                                  resolution=image_resolution,
-                                  interpolation=cv2.INTER_NEAREST)
          return PIL.Image.fromarray(color_seg)


  class ImageSegmentor:
      def __init__(self):
+         self.image_processor = AutoImageProcessor.from_pretrained("openmmlab/upernet-convnext-small")
+         self.image_segmentor = UperNetForSemanticSegmentation.from_pretrained("openmmlab/upernet-convnext-small")

      @torch.inference_mode()
      def __call__(self, image: np.ndarray, **kwargs) -> PIL.Image.Image:
+         detect_resolution = kwargs.pop("detect_resolution", 512)
+         image_resolution = kwargs.pop("image_resolution", 512)
          image = HWC3(image)
          image = resize_image(image, resolution=detect_resolution)
          image = PIL.Image.fromarray(image)

+         pixel_values = self.image_processor(image, return_tensors="pt").pixel_values
          outputs = self.image_segmentor(pixel_values)
+         seg = self.image_processor.post_process_semantic_segmentation(outputs, target_sizes=[image.size[::-1]])[0]
          color_seg = np.zeros((seg.shape[0], seg.shape[1], 3), dtype=np.uint8)
          for label, color in enumerate(ade_palette()):
              color_seg[seg == label, :] = color
          color_seg = color_seg.astype(np.uint8)

+         color_seg = resize_image(color_seg, resolution=image_resolution, interpolation=cv2.INTER_NEAREST)
          return PIL.Image.fromarray(color_seg)
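ImageSegmentor follows the same calling convention: an HWC ndarray in, and an ADE20K-colorized segmentation map out as a PIL image, resized with nearest-neighbor interpolation so label colors are not blended. A minimal sketch (the file paths are hypothetical):

    import numpy as np
    import PIL.Image

    from image_segmentor import ImageSegmentor

    segmentor = ImageSegmentor()
    image = np.array(PIL.Image.open("photo.png"))  # hypothetical input image
    seg_map = segmentor(image, detect_resolution=512, image_resolution=512)
    seg_map.save("seg.png")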
model.py CHANGED
@@ -6,28 +6,31 @@ import numpy as np
  import PIL.Image
  import torch
  from controlnet_aux.util import HWC3
- from diffusers import (ControlNetModel, DiffusionPipeline,
-                        StableDiffusionControlNetPipeline,
-                        UniPCMultistepScheduler)

  from cv_utils import resize_image
  from preprocessor import Preprocessor
  from settings import MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES

  CONTROLNET_MODEL_IDS = {
-     'Openpose': 'lllyasviel/control_v11p_sd15_openpose',
-     'Canny': 'lllyasviel/control_v11p_sd15_canny',
-     'MLSD': 'lllyasviel/control_v11p_sd15_mlsd',
-     'scribble': 'lllyasviel/control_v11p_sd15_scribble',
-     'softedge': 'lllyasviel/control_v11p_sd15_softedge',
-     'segmentation': 'lllyasviel/control_v11p_sd15_seg',
-     'depth': 'lllyasviel/control_v11f1p_sd15_depth',
-     'NormalBae': 'lllyasviel/control_v11p_sd15_normalbae',
-     'lineart': 'lllyasviel/control_v11p_sd15_lineart',
-     'lineart_anime': 'lllyasviel/control_v11p_sd15s2_lineart_anime',
-     'shuffle': 'lllyasviel/control_v11e_sd15_shuffle',
-     'ip2p': 'lllyasviel/control_v11e_sd15_ip2p',
-     'inpaint': 'lllyasviel/control_v11e_sd15_inpaint',
  }


@@ -37,31 +40,28 @@ def download_all_controlnet_weights() -> None:


  class Model:
-     def __init__(self,
-                  base_model_id: str = 'runwayml/stable-diffusion-v1-5',
-                  task_name: str = 'Canny'):
-         self.device = torch.device(
-             'cuda:0' if torch.cuda.is_available() else 'cpu')
-         self.base_model_id = ''
-         self.task_name = ''
          self.pipe = self.load_pipe(base_model_id, task_name)
          self.preprocessor = Preprocessor()

      def load_pipe(self, base_model_id: str, task_name) -> DiffusionPipeline:
-         if base_model_id == self.base_model_id and task_name == self.task_name and hasattr(
-                 self, 'pipe') and self.pipe is not None:
              return self.pipe
          model_id = CONTROLNET_MODEL_IDS[task_name]
-         controlnet = ControlNetModel.from_pretrained(model_id,
-                                                      torch_dtype=torch.float16)
          pipe = StableDiffusionControlNetPipeline.from_pretrained(
-             base_model_id,
-             safety_checker=None,
-             controlnet=controlnet,
-             torch_dtype=torch.float16)
-         pipe.scheduler = UniPCMultistepScheduler.from_config(
-             pipe.scheduler.config)
-         if self.device.type == 'cuda':
              pipe.enable_xformers_memory_efficient_attention()
          pipe.to(self.device)
          torch.cuda.empty_cache()
@@ -85,13 +85,12 @@ class Model:
      def load_controlnet_weight(self, task_name: str) -> None:
          if task_name == self.task_name:
              return
-         if self.pipe is not None and hasattr(self.pipe, 'controlnet'):
              del self.pipe.controlnet
          torch.cuda.empty_cache()
          gc.collect()
          model_id = CONTROLNET_MODEL_IDS[task_name]
-         controlnet = ControlNetModel.from_pretrained(model_id,
-                                                      torch_dtype=torch.float16)
          controlnet.to(self.device)
          torch.cuda.empty_cache()
          gc.collect()
@@ -102,10 +101,10 @@ class Model:
          if not prompt:
              prompt = additional_prompt
          else:
-             prompt = f'{prompt}, {additional_prompt}'
          return prompt

-     @torch.autocast('cuda')
      def run_pipe(
          self,
          prompt: str,
@@ -117,13 +116,15 @@ class Model:
          seed: int,
      ) -> list[PIL.Image.Image]:
          generator = torch.Generator().manual_seed(seed)
-         return self.pipe(prompt=prompt,
-                          negative_prompt=negative_prompt,
-                          guidance_scale=guidance_scale,
-                          num_images_per_prompt=num_images,
-                          num_inference_steps=num_steps,
-                          generator=generator,
-                          image=control_image).images

      @torch.inference_mode()
      def process_canny(
@@ -147,13 +148,12 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         self.preprocessor.load('Canny')
-         control_image = self.preprocessor(image=image,
-                                           low_threshold=low_threshold,
-                                           high_threshold=high_threshold,
-                                           detect_resolution=image_resolution)

-         self.load_controlnet_weight('Canny')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -188,7 +188,7 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         self.preprocessor.load('MLSD')
          control_image = self.preprocessor(
              image=image,
              image_resolution=image_resolution,
@@ -196,7 +196,7 @@ class Model:
              thr_v=value_threshold,
              thr_d=distance_threshold,
          )
-         self.load_controlnet_weight('MLSD')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -230,11 +230,11 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
-         elif preprocessor_name == 'HED':
              self.preprocessor.load(preprocessor_name)
              control_image = self.preprocessor(
                  image=image,
@@ -242,7 +242,7 @@ class Model:
                  detect_resolution=preprocess_resolution,
                  scribble=False,
              )
-         elif preprocessor_name == 'PidiNet':
              self.preprocessor.load(preprocessor_name)
              control_image = self.preprocessor(
                  image=image,
@@ -250,7 +250,7 @@ class Model:
                  detect_resolution=preprocess_resolution,
                  safe=False,
              )
-         self.load_controlnet_weight('scribble')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -282,12 +282,12 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         image = image_and_mask['mask']
          image = HWC3(image)
          image = resize_image(image, resolution=image_resolution)
          control_image = PIL.Image.fromarray(image)

-         self.load_controlnet_weight('scribble')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -321,22 +321,22 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
-         elif preprocessor_name in ['HED', 'HED safe']:
-             safe = 'safe' in preprocessor_name
-             self.preprocessor.load('HED')
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
                  scribble=safe,
              )
-         elif preprocessor_name in ['PidiNet', 'PidiNet safe']:
-             safe = 'safe' in preprocessor_name
-             self.preprocessor.load('PidiNet')
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
@@ -345,7 +345,7 @@ class Model:
              )
          else:
              raise ValueError
-         self.load_controlnet_weight('softedge')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -379,19 +379,19 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
          else:
-             self.preprocessor.load('Openpose')
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
                  hand_and_face=True,
              )
-         self.load_controlnet_weight('Openpose')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -425,7 +425,7 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
@@ -436,7 +436,7 @@ class Model:
              image_resolution=image_resolution,
              detect_resolution=preprocess_resolution,
          )
-         self.load_controlnet_weight('segmentation')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -470,7 +470,7 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
@@ -481,7 +481,7 @@ class Model:
              image_resolution=image_resolution,
              detect_resolution=preprocess_resolution,
          )
-         self.load_controlnet_weight('depth')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -515,18 +515,18 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
          else:
-             self.preprocessor.load('NormalBae')
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
              )
-         self.load_controlnet_weight('NormalBae')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -560,30 +560,30 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name in ['None', 'None (anime)']:
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
-         elif preprocessor_name in ['Lineart', 'Lineart coarse']:
-             coarse = 'coarse' in preprocessor_name
-             self.preprocessor.load('Lineart')
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
                  coarse=coarse,
              )
-         elif preprocessor_name == 'Lineart (anime)':
-             self.preprocessor.load('LineartAnime')
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
              )
-         if 'anime' in preprocessor_name:
-             self.load_controlnet_weight('lineart_anime')
          else:
-             self.load_controlnet_weight('lineart')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -616,7 +616,7 @@ class Model:
          if num_images > MAX_NUM_IMAGES:
              raise ValueError

-         if preprocessor_name == 'None':
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
@@ -626,7 +626,7 @@ class Model:
              image=image,
              image_resolution=image_resolution,
          )
-         self.load_controlnet_weight('shuffle')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
@@ -661,7 +661,7 @@ class Model:
          image = HWC3(image)
          image = resize_image(image, resolution=image_resolution)
          control_image = PIL.Image.fromarray(image)
-         self.load_controlnet_weight('ip2p')
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

  import PIL.Image
  import torch
  from controlnet_aux.util import HWC3
+ from diffusers import (
+     ControlNetModel,
+     DiffusionPipeline,
+     StableDiffusionControlNetPipeline,
+     UniPCMultistepScheduler,
+ )

  from cv_utils import resize_image
  from preprocessor import Preprocessor
  from settings import MAX_IMAGE_RESOLUTION, MAX_NUM_IMAGES

  CONTROLNET_MODEL_IDS = {
+     "Openpose": "lllyasviel/control_v11p_sd15_openpose",
+     "Canny": "lllyasviel/control_v11p_sd15_canny",
+     "MLSD": "lllyasviel/control_v11p_sd15_mlsd",
+     "scribble": "lllyasviel/control_v11p_sd15_scribble",
+     "softedge": "lllyasviel/control_v11p_sd15_softedge",
+     "segmentation": "lllyasviel/control_v11p_sd15_seg",
+     "depth": "lllyasviel/control_v11f1p_sd15_depth",
+     "NormalBae": "lllyasviel/control_v11p_sd15_normalbae",
+     "lineart": "lllyasviel/control_v11p_sd15_lineart",
+     "lineart_anime": "lllyasviel/control_v11p_sd15s2_lineart_anime",
+     "shuffle": "lllyasviel/control_v11e_sd15_shuffle",
+     "ip2p": "lllyasviel/control_v11e_sd15_ip2p",
+     "inpaint": "lllyasviel/control_v11e_sd15_inpaint",
  }


  class Model:
+     def __init__(self, base_model_id: str = "runwayml/stable-diffusion-v1-5", task_name: str = "Canny"):
+         self.device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+         self.base_model_id = ""
+         self.task_name = ""
          self.pipe = self.load_pipe(base_model_id, task_name)
          self.preprocessor = Preprocessor()

      def load_pipe(self, base_model_id: str, task_name) -> DiffusionPipeline:
+         if (
+             base_model_id == self.base_model_id
+             and task_name == self.task_name
+             and hasattr(self, "pipe")
+             and self.pipe is not None
+         ):
              return self.pipe
          model_id = CONTROLNET_MODEL_IDS[task_name]
+         controlnet = ControlNetModel.from_pretrained(model_id, torch_dtype=torch.float16)
          pipe = StableDiffusionControlNetPipeline.from_pretrained(
+             base_model_id, safety_checker=None, controlnet=controlnet, torch_dtype=torch.float16
+         )
+         pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)
+         if self.device.type == "cuda":
              pipe.enable_xformers_memory_efficient_attention()
          pipe.to(self.device)
          torch.cuda.empty_cache()

      def load_controlnet_weight(self, task_name: str) -> None:
          if task_name == self.task_name:
              return
+         if self.pipe is not None and hasattr(self.pipe, "controlnet"):
              del self.pipe.controlnet
          torch.cuda.empty_cache()
          gc.collect()
          model_id = CONTROLNET_MODEL_IDS[task_name]
+         controlnet = ControlNetModel.from_pretrained(model_id, torch_dtype=torch.float16)
          controlnet.to(self.device)
          torch.cuda.empty_cache()
          gc.collect()

          if not prompt:
              prompt = additional_prompt
          else:
+             prompt = f"{prompt}, {additional_prompt}"
          return prompt

+     @torch.autocast("cuda")
      def run_pipe(
          self,
          prompt: str,

          seed: int,
      ) -> list[PIL.Image.Image]:
          generator = torch.Generator().manual_seed(seed)
+         return self.pipe(
+             prompt=prompt,
+             negative_prompt=negative_prompt,
+             guidance_scale=guidance_scale,
+             num_images_per_prompt=num_images,
+             num_inference_steps=num_steps,
+             generator=generator,
+             image=control_image,
+         ).images

      @torch.inference_mode()
      def process_canny(

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         self.preprocessor.load("Canny")
+         control_image = self.preprocessor(
+             image=image, low_threshold=low_threshold, high_threshold=high_threshold, detect_resolution=image_resolution
+         )

+         self.load_controlnet_weight("Canny")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         self.preprocessor.load("MLSD")
          control_image = self.preprocessor(
              image=image,
              image_resolution=image_resolution,
              thr_v=value_threshold,
              thr_d=distance_threshold,
          )
+         self.load_controlnet_weight("MLSD")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
+         elif preprocessor_name == "HED":
              self.preprocessor.load(preprocessor_name)
              control_image = self.preprocessor(
                  image=image,
                  detect_resolution=preprocess_resolution,
                  scribble=False,
              )
+         elif preprocessor_name == "PidiNet":
              self.preprocessor.load(preprocessor_name)
              control_image = self.preprocessor(
                  image=image,
                  detect_resolution=preprocess_resolution,
                  safe=False,
              )
+         self.load_controlnet_weight("scribble")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         image = image_and_mask["mask"]
          image = HWC3(image)
          image = resize_image(image, resolution=image_resolution)
          control_image = PIL.Image.fromarray(image)

+         self.load_controlnet_weight("scribble")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
+         elif preprocessor_name in ["HED", "HED safe"]:
+             safe = "safe" in preprocessor_name
+             self.preprocessor.load("HED")
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
                  scribble=safe,
              )
+         elif preprocessor_name in ["PidiNet", "PidiNet safe"]:
+             safe = "safe" in preprocessor_name
+             self.preprocessor.load("PidiNet")
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
              )
          else:
              raise ValueError
+         self.load_controlnet_weight("softedge")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
          else:
+             self.preprocessor.load("Openpose")
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
                  hand_and_face=True,
              )
+         self.load_controlnet_weight("Openpose")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)

              image_resolution=image_resolution,
              detect_resolution=preprocess_resolution,
          )
+         self.load_controlnet_weight("segmentation")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)

              image_resolution=image_resolution,
              detect_resolution=preprocess_resolution,
          )
+         self.load_controlnet_weight("depth")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
          else:
+             self.preprocessor.load("NormalBae")
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
              )
+         self.load_controlnet_weight("NormalBae")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name in ["None", "None (anime)"]:
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)
+         elif preprocessor_name in ["Lineart", "Lineart coarse"]:
+             coarse = "coarse" in preprocessor_name
+             self.preprocessor.load("Lineart")
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
                  coarse=coarse,
              )
+         elif preprocessor_name == "Lineart (anime)":
+             self.preprocessor.load("LineartAnime")
              control_image = self.preprocessor(
                  image=image,
                  image_resolution=image_resolution,
                  detect_resolution=preprocess_resolution,
              )
+         if "anime" in preprocessor_name:
+             self.load_controlnet_weight("lineart_anime")
          else:
+             self.load_controlnet_weight("lineart")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          if num_images > MAX_NUM_IMAGES:
              raise ValueError

+         if preprocessor_name == "None":
              image = HWC3(image)
              image = resize_image(image, resolution=image_resolution)
              control_image = PIL.Image.fromarray(image)

              image=image,
              image_resolution=image_resolution,
          )
+         self.load_controlnet_weight("shuffle")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,

          image = HWC3(image)
          image = resize_image(image, resolution=image_resolution)
          control_image = PIL.Image.fromarray(image)
+         self.load_controlnet_weight("ip2p")
          results = self.run_pipe(
              prompt=self.get_prompt(prompt, additional_prompt),
              negative_prompt=negative_prompt,
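Everything in Model keys off CONTROLNET_MODEL_IDS: load_pipe builds a StableDiffusionControlNetPipeline for the initial task, and load_controlnet_weight later swaps only the ControlNet weights when the task changes. A minimal sketch of that flow, assuming a CUDA machine with the weights available locally:

    from model import Model

    model = Model(task_name="Canny")  # pipeline with lllyasviel/control_v11p_sd15_canny
    model.load_controlnet_weight("depth")  # swaps in lllyasviel/control_v11f1p_sd15_depth

The per-task process_* methods then pair the matching preprocessor output with run_pipe, which seeds a torch.Generator and passes the control image to the pipeline.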
preprocessor.py CHANGED
@@ -3,10 +3,18 @@ import gc
  import numpy as np
  import PIL.Image
  import torch
- from controlnet_aux import (CannyDetector, ContentShuffleDetector, HEDdetector,
-                             LineartAnimeDetector, LineartDetector,
-                             MidasDetector, MLSDdetector, NormalBaeDetector,
-                             OpenposeDetector, PidiNetDetector)
  from controlnet_aux.util import HWC3

  from cv_utils import resize_image
@@ -15,38 +23,38 @@ from image_segmentor import ImageSegmentor


  class Preprocessor:
-     MODEL_ID = 'lllyasviel/Annotators'

      def __init__(self):
          self.model = None
-         self.name = ''

      def load(self, name: str) -> None:
          if name == self.name:
              return
-         if name == 'HED':
              self.model = HEDdetector.from_pretrained(self.MODEL_ID)
-         elif name == 'Midas':
              self.model = MidasDetector.from_pretrained(self.MODEL_ID)
-         elif name == 'MLSD':
              self.model = MLSDdetector.from_pretrained(self.MODEL_ID)
-         elif name == 'Openpose':
              self.model = OpenposeDetector.from_pretrained(self.MODEL_ID)
-         elif name == 'PidiNet':
              self.model = PidiNetDetector.from_pretrained(self.MODEL_ID)
-         elif name == 'NormalBae':
              self.model = NormalBaeDetector.from_pretrained(self.MODEL_ID)
-         elif name == 'Lineart':
              self.model = LineartDetector.from_pretrained(self.MODEL_ID)
-         elif name == 'LineartAnime':
              self.model = LineartAnimeDetector.from_pretrained(self.MODEL_ID)
-         elif name == 'Canny':
              self.model = CannyDetector()
-         elif name == 'ContentShuffle':
              self.model = ContentShuffleDetector()
-         elif name == 'DPT':
              self.model = DepthEstimator()
-         elif name == 'UPerNet':
              self.model = ImageSegmentor()
          else:
              raise ValueError
@@ -55,17 +63,17 @@ class Preprocessor:
          self.name = name

      def __call__(self, image: PIL.Image.Image, **kwargs) -> PIL.Image.Image:
-         if self.name == 'Canny':
-             if 'detect_resolution' in kwargs:
-                 detect_resolution = kwargs.pop('detect_resolution')
              image = np.array(image)
              image = HWC3(image)
              image = resize_image(image, resolution=detect_resolution)
              image = self.model(image, **kwargs)
              return PIL.Image.fromarray(image)
-         elif self.name == 'Midas':
-             detect_resolution = kwargs.pop('detect_resolution', 512)
-             image_resolution = kwargs.pop('image_resolution', 512)
              image = np.array(image)
              image = HWC3(image)
              image = resize_image(image, resolution=detect_resolution)

  import numpy as np
  import PIL.Image
  import torch
+ from controlnet_aux import (
+     CannyDetector,
+     ContentShuffleDetector,
+     HEDdetector,
+     LineartAnimeDetector,
+     LineartDetector,
+     MidasDetector,
+     MLSDdetector,
+     NormalBaeDetector,
+     OpenposeDetector,
+     PidiNetDetector,
+ )
  from controlnet_aux.util import HWC3

  from cv_utils import resize_image


  class Preprocessor:
+     MODEL_ID = "lllyasviel/Annotators"

      def __init__(self):
          self.model = None
+         self.name = ""

      def load(self, name: str) -> None:
          if name == self.name:
              return
+         if name == "HED":
              self.model = HEDdetector.from_pretrained(self.MODEL_ID)
+         elif name == "Midas":
              self.model = MidasDetector.from_pretrained(self.MODEL_ID)
+         elif name == "MLSD":
              self.model = MLSDdetector.from_pretrained(self.MODEL_ID)
+         elif name == "Openpose":
              self.model = OpenposeDetector.from_pretrained(self.MODEL_ID)
+         elif name == "PidiNet":
              self.model = PidiNetDetector.from_pretrained(self.MODEL_ID)
+         elif name == "NormalBae":
              self.model = NormalBaeDetector.from_pretrained(self.MODEL_ID)
+         elif name == "Lineart":
              self.model = LineartDetector.from_pretrained(self.MODEL_ID)
+         elif name == "LineartAnime":
              self.model = LineartAnimeDetector.from_pretrained(self.MODEL_ID)
+         elif name == "Canny":
              self.model = CannyDetector()
+         elif name == "ContentShuffle":
              self.model = ContentShuffleDetector()
+         elif name == "DPT":
              self.model = DepthEstimator()
+         elif name == "UPerNet":
              self.model = ImageSegmentor()
          else:
              raise ValueError

          self.name = name

      def __call__(self, image: PIL.Image.Image, **kwargs) -> PIL.Image.Image:
+         if self.name == "Canny":
+             if "detect_resolution" in kwargs:
+                 detect_resolution = kwargs.pop("detect_resolution")
              image = np.array(image)
              image = HWC3(image)
              image = resize_image(image, resolution=detect_resolution)
              image = self.model(image, **kwargs)
              return PIL.Image.fromarray(image)
+         elif self.name == "Midas":
+             detect_resolution = kwargs.pop("detect_resolution", 512)
+             image_resolution = kwargs.pop("image_resolution", 512)
              image = np.array(image)
              image = HWC3(image)
              image = resize_image(image, resolution=detect_resolution)
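Preprocessor is a small registry: load(name) instantiates one of the controlnet_aux detectors (or the local DepthEstimator / ImageSegmentor), and the early return on name == self.name makes repeated loads of the same preprocessor no-ops. A minimal sketch (the file path is hypothetical; the Canny branch also forwards any extra kwargs, such as thresholds, to the detector):

    import PIL.Image

    from preprocessor import Preprocessor

    preprocessor = Preprocessor()
    preprocessor.load("Canny")  # any of the names handled in Preprocessor.load
    control = preprocessor(PIL.Image.open("photo.png"), detect_resolution=512)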
settings.py CHANGED
@@ -2,17 +2,14 @@ import os

  import numpy as np

- DEFAULT_MODEL_ID = os.getenv('DEFAULT_MODEL_ID',
-                              'runwayml/stable-diffusion-v1-5')

- MAX_NUM_IMAGES = int(os.getenv('MAX_NUM_IMAGES', '3'))
- DEFAULT_NUM_IMAGES = min(MAX_NUM_IMAGES,
-                          int(os.getenv('DEFAULT_NUM_IMAGES', '3')))
- MAX_IMAGE_RESOLUTION = int(os.getenv('MAX_IMAGE_RESOLUTION', '768'))
- DEFAULT_IMAGE_RESOLUTION = min(
-     MAX_IMAGE_RESOLUTION, int(os.getenv('DEFAULT_IMAGE_RESOLUTION', '768')))

- ALLOW_CHANGING_BASE_MODEL = os.getenv('SPACE_ID') != 'hysts/ControlNet-v1-1'
- SHOW_DUPLICATE_BUTTON = os.getenv('SHOW_DUPLICATE_BUTTON') == '1'

  MAX_SEED = np.iinfo(np.int32).max

  import numpy as np

+ DEFAULT_MODEL_ID = os.getenv("DEFAULT_MODEL_ID", "runwayml/stable-diffusion-v1-5")

+ MAX_NUM_IMAGES = int(os.getenv("MAX_NUM_IMAGES", "3"))
+ DEFAULT_NUM_IMAGES = min(MAX_NUM_IMAGES, int(os.getenv("DEFAULT_NUM_IMAGES", "3")))
+ MAX_IMAGE_RESOLUTION = int(os.getenv("MAX_IMAGE_RESOLUTION", "768"))
+ DEFAULT_IMAGE_RESOLUTION = min(MAX_IMAGE_RESOLUTION, int(os.getenv("DEFAULT_IMAGE_RESOLUTION", "768")))

+ ALLOW_CHANGING_BASE_MODEL = os.getenv("SPACE_ID") != "hysts/ControlNet-v1-1"
+ SHOW_DUPLICATE_BUTTON = os.getenv("SHOW_DUPLICATE_BUTTON") == "1"

  MAX_SEED = np.iinfo(np.int32).max
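All of these settings are environment-driven, and each DEFAULT_* value is clamped to its MAX_* counterpart with min(), so an override can never exceed the configured maximum. A quick sketch of that behavior (the override value is illustrative):

    import os

    os.environ["MAX_NUM_IMAGES"] = "2"  # must be set before settings is imported
    import settings

    assert settings.MAX_NUM_IMAGES == 2
    assert settings.DEFAULT_NUM_IMAGES == 2  # min(2, 3): clamped to the new maximum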