mishig HF Staff sayakpaul HF Staff commited on
Commit
ecd427f
·
0 Parent(s):

Duplicate from diffusers/controlnet-openpose

Browse files

Co-authored-by: Sayak Paul <sayakpaul@users.noreply.huggingface.co>

Files changed (5) hide show
  1. .gitattributes +34 -0
  2. README.md +13 -0
  3. app.py +137 -0
  4. requirements.txt +8 -0
  5. yoga1.jpeg +0 -0
.gitattributes ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: ControlNet Openpose
3
+ emoji: 😻
4
+ colorFrom: green
5
+ colorTo: gray
6
+ sdk: gradio
7
+ sdk_version: 3.23.0
8
+ app_file: app.py
9
+ pinned: false
10
+ duplicated_from: diffusers/controlnet-openpose
11
+ ---
12
+
13
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
app.py ADDED
@@ -0,0 +1,137 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from controlnet_aux import OpenposeDetector
2
+ from diffusers import StableDiffusionControlNetPipeline, ControlNetModel
3
+ from diffusers import UniPCMultistepScheduler
4
+ import gradio as gr
5
+ import torch
6
+ import base64
7
+ from io import BytesIO
8
+ from PIL import Image
9
+ # live conditioning
10
+ canvas_html = "<pose-canvas id='canvas-root' style='display:flex;max-width: 500px;margin: 0 auto;'></pose-canvas>"
11
+ load_js = """
12
+ async () => {
13
+ const url = "https://huggingface.co/datasets/radames/gradio-components/raw/main/pose-gradio.js"
14
+ fetch(url)
15
+ .then(res => res.text())
16
+ .then(text => {
17
+ const script = document.createElement('script');
18
+ script.type = "module"
19
+ script.src = URL.createObjectURL(new Blob([text], { type: 'application/javascript' }));
20
+ document.head.appendChild(script);
21
+ });
22
+ }
23
+ """
24
+ get_js_image = """
25
+ async (image_in_img, prompt, image_file_live_opt, live_conditioning) => {
26
+ const canvasEl = document.getElementById("canvas-root");
27
+ const data = canvasEl? canvasEl._data : null;
28
+ return [image_in_img, prompt, image_file_live_opt, data]
29
+ }
30
+ """
31
+
32
+ # Constants
33
+ low_threshold = 100
34
+ high_threshold = 200
35
+
36
+ # Models
37
+ pose_model = OpenposeDetector.from_pretrained("lllyasviel/ControlNet")
38
+ controlnet = ControlNetModel.from_pretrained(
39
+ "lllyasviel/sd-controlnet-openpose", torch_dtype=torch.float16
40
+ )
41
+ pipe = StableDiffusionControlNetPipeline.from_pretrained(
42
+ "runwayml/stable-diffusion-v1-5", controlnet=controlnet, safety_checker=None, torch_dtype=torch.float16
43
+ )
44
+ pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)
45
+
46
+ # This command loads the individual model components on GPU on-demand. So, we don't
47
+ # need to explicitly call pipe.to("cuda").
48
+ pipe.enable_model_cpu_offload()
49
+
50
+ # xformers
51
+ pipe.enable_xformers_memory_efficient_attention()
52
+
53
+ # Generator seed.
54
+ generator = torch.manual_seed(0)
55
+
56
+
57
def get_pose(image):
    """Run the module-level ``pose_model`` on ``image`` and return its result."""
    detected_pose = pose_model(image)
    return detected_pose
59
+
60
+
61
def generate_images(image, prompt, image_file_live_opt='file', live_conditioning=None):
    """Generate pose-conditioned images for ``prompt``.

    Args:
        image: Uploaded image, used when ``image_file_live_opt`` is ``'file'``;
            it is passed to ``get_pose`` to obtain the conditioning image.
        prompt: Text prompt forwarded to the diffusion pipeline.
        image_file_live_opt: ``'file'`` to derive the pose from ``image``, or
            ``'webcam'`` to use the canvas image held in ``live_conditioning``.
        live_conditioning: Mapping whose ``'image'`` entry is a base64 string,
            optionally preceded by a ``"<header>,"`` data-URL prefix. May be
            ``None`` or empty.

    Returns:
        A list holding the conditioning (pose) image followed by the images
        produced by the pipeline.

    Raises:
        gr.Error: If the input required by the selected mode is missing, the
            mode is not recognised, or pose extraction / generation fails.
    """
    # The browser-side hook can hand back null and gr.Examples calls this with
    # only (image, prompt), so normalise before doing any membership test.
    if not isinstance(live_conditioning, dict):
        live_conditioning = {}

    # Validate against the input the selected mode actually consumes, so the
    # user gets a clear message instead of a TypeError/KeyError further down.
    if image_file_live_opt == 'file':
        if image is None:
            raise gr.Error("Please provide an image")
    elif image_file_live_opt == 'webcam':
        if 'image' not in live_conditioning:
            raise gr.Error("Please provide an image")
    else:
        raise gr.Error(f"Unknown input mode: {image_file_live_opt!r}")

    try:
        if image_file_live_opt == 'file':
            pose = get_pose(image)
        else:
            encoded = live_conditioning['image']
            # Keep only the payload after the data-URL header, if one is present.
            image_data = base64.b64decode(encoded.split(',', 1)[-1])
            pose = Image.open(BytesIO(image_data)).convert('RGB').resize((512, 512))
        output = pipe(
            prompt,
            pose,
            generator=generator,
            num_images_per_prompt=3,
            num_inference_steps=20,
        )
    except Exception as e:
        # Surface any failure in the UI while keeping the original traceback.
        raise gr.Error(str(e)) from e

    return [pose, *output.images]
86
+
87
+
88
def toggle(choice):
    """Return visibility updates for the upload widget and the pose canvas.

    For ``"file"`` the upload widget is shown and the canvas hidden; for
    ``"webcam"`` the upload widget is hidden and the canvas is shown with
    ``canvas_html`` as its value. Both widgets are reset to ``None`` otherwise.
    Any other choice yields ``None``.
    """
    if choice not in ("file", "webcam"):
        return None

    use_file = choice == "file"
    upload_update = gr.update(visible=use_file, value=None)
    canvas_update = gr.update(
        visible=not use_file,
        value=None if use_file else canvas_html,
    )
    return upload_update, canvas_update
93
+
94
+
95
+ with gr.Blocks() as blocks:
96
+ gr.Markdown("""
97
+ ## Generate controlled outputs with ControlNet and Stable Diffusion
98
+ This Space uses pose estimated lines as the additional conditioning
99
+ [Check out our blog to see how this was done (and train your own controlnet)](https://huggingface.co/blog/train-your-controlnet)
100
+ """)
101
+ with gr.Row():
102
+ live_conditioning = gr.JSON(value={}, visible=False)
103
+ with gr.Column():
104
+ image_file_live_opt = gr.Radio(["file", "webcam"], value="file",
105
+ label="How would you like to upload your image?")
106
+ image_in_img = gr.Image(source="upload", visible=True, type="pil")
107
+ canvas = gr.HTML(None, elem_id="canvas_html", visible=False)
108
+
109
+ image_file_live_opt.change(fn=toggle,
110
+ inputs=[image_file_live_opt],
111
+ outputs=[image_in_img, canvas],
112
+ queue=False)
113
+ prompt = gr.Textbox(
114
+ label="Enter your prompt",
115
+ max_lines=1,
116
+ placeholder="best quality, extremely detailed",
117
+ )
118
+ run_button = gr.Button("Generate")
119
+ with gr.Column():
120
+ gallery = gr.Gallery().style(grid=[2], height="auto")
121
+ run_button.click(fn=generate_images,
122
+ inputs=[image_in_img, prompt,
123
+ image_file_live_opt, live_conditioning],
124
+ outputs=[gallery],
125
+ _js=get_js_image)
126
+ blocks.load(None, None, None, _js=load_js)
127
+
128
+ gr.Examples(fn=generate_images,
129
+ examples=[
130
+ ["./yoga1.jpeg",
131
+ "best quality, extremely detailed"]
132
+ ],
133
+ inputs=[image_in_img, prompt],
134
+ outputs=[gallery],
135
+ cache_examples=True)
136
+
137
+ blocks.launch(debug=True)
requirements.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ git+https://github.com/huggingface/diffusers.git
2
+ transformers
3
+ git+https://github.com/huggingface/accelerate
4
+ torch==1.13.1
5
+ numpy
6
+ controlnet_aux
7
+ xformers==0.0.16
8
+ triton
yoga1.jpeg ADDED