bramw committed on
Commit
470d781
1 Parent(s): ad298de

Create working_app.py

Browse files
Files changed (1) hide show
  1. working_app.py +139 -0
working_app.py ADDED
@@ -0,0 +1,139 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import numpy as np
3
+ # from edict_functions import EDICT_editing
4
+ from PIL import Image
5
+ from utils import Endpoint, get_token
6
+ from io import BytesIO
7
+ import requests
8
+
9
+
10
+ endpoint = Endpoint()
11
+
12
def local_edict(x, source_text, edit_text,
                edit_strength, guidance_scale,
                steps=50, mix_weight=0.93):
    """Edit an image with EDICT in-process instead of via the remote endpoint.

    Args:
        x: Image data accepted by ``Image.fromarray`` (presumably the numpy
            array Gradio passes for an "image" input -- confirm with caller).
        source_text: Description of the original image.
        edit_text: Description of the desired edited image.
        edit_strength: Forwarded to ``EDICT_editing`` as
            ``init_image_strength``.
        guidance_scale: Forwarded to ``EDICT_editing`` unchanged.
        steps: Forwarded to ``EDICT_editing`` unchanged.
        mix_weight: Forwarded to ``EDICT_editing`` unchanged.

    Returns:
        A numpy array built from the first element of the
        ``EDICT_editing`` result.

    Raises:
        ImportError: If ``edict_functions`` is not installed alongside
            this app.
    """
    # The module-level import of EDICT_editing is commented out in this file,
    # so the name was undefined here and every call raised NameError.
    # Importing lazily keeps the hosted app importable without the module
    # while making this function usable wherever the module is available.
    from edict_functions import EDICT_editing

    source_image = Image.fromarray(x)
    results = EDICT_editing(
        source_image,
        source_text,
        edit_text,
        steps=steps,
        mix_weight=mix_weight,
        init_image_strength=edit_strength,
        guidance_scale=guidance_scale,
    )
    # Only the first element of the result is used.
    return np.array(results[0])
25
+
26
def encode_image(image):
    """Serialize a PIL image to an in-memory JPEG (quality 95).

    Args:
        image: A PIL image (anything exposing ``mode``, ``convert`` and
            ``save`` the way ``PIL.Image.Image`` does).

    Returns:
        A ``BytesIO`` positioned at offset 0 and holding the JPEG bytes,
        ready to be handed to an uploader that reads from the start.
    """
    # Pillow's JPEG writer only accepts these modes; anything else (e.g. the
    # RGBA array produced by a PNG with transparency) raises OSError on save.
    # Convert those to RGB and leave already-writable modes untouched.
    jpeg_modes = ("1", "L", "RGB", "RGBX", "CMYK", "YCbCr")
    if image.mode not in jpeg_modes:
        image = image.convert("RGB")

    buffered = BytesIO()
    image.save(buffered, format="JPEG", quality=95)
    # Rewind so the consumer reads from the first byte, not from EOF.
    buffered.seek(0)
    return buffered
32
+
33
+
34
+
35
def decode_image(img_obj):
    """Open *img_obj* with PIL and return the image converted to RGB.

    Args:
        img_obj: Whatever ``Image.open`` accepts (the caller in this file
            passes a ``BytesIO`` wrapping the HTTP response body).

    Returns:
        The opened image after ``convert("RGB")``.
    """
    opened = Image.open(img_obj)
    return opened.convert("RGB")
38
+
39
def edict(x, source_text, edit_text,
          edit_strength, guidance_scale,
          steps=50, mix_weight=0.93):
    """Edit an image by POSTing it to the remote EDICT endpoint.

    The image is JPEG-encoded and uploaded as the ``image`` file field to
    ``<endpoint.url>/api/edit`` together with the text prompts and the two
    strength parameters as form fields.

    Args:
        x: Image data accepted by ``Image.fromarray`` (presumably the numpy
            array Gradio passes for an "image" input -- confirm with caller).
        source_text: Sent as the ``source_text`` form field.
        edit_text: Sent as the ``edit_text`` form field.
        edit_strength: Sent as the ``edit_strength`` form field.
        guidance_scale: Sent as the ``guidance_scale`` form field.
        steps: Accepted for signature parity with ``local_edict``; it is
            not sent to the endpoint.
        mix_weight: Accepted for signature parity with ``local_edict``; it
            is not sent to the endpoint.

    Returns:
        A numpy array of the RGB image decoded from the response body.

    Raises:
        gr.Error: If the endpoint cannot be reached, times out, or answers
            with a non-200 status. Previously a plain string was returned
            on failure, which an image output cannot render.
    """
    # (connect, read) seconds. The read budget is generous because the edit
    # runs server-side; without any timeout a stalled endpoint would block
    # this worker indefinitely.
    request_timeout = (10, 300)

    url = endpoint.url + "/api/edit"
    headers = {
        "User-Agent": "EDICT HuggingFace Space",
        "Auth-Token": get_token(),
    }
    data = {
        "source_text": source_text,
        "edit_text": edit_text,
        "edit_strength": edit_strength,
        "guidance_scale": guidance_scale,
    }
    files = {"image": encode_image(Image.fromarray(x))}

    try:
        response = requests.post(
            url,
            data=data,
            files=files,
            headers=headers,
            timeout=request_timeout,
        )
    except requests.RequestException as err:
        # Keep the message generic: the exception text may include the
        # endpoint URL, which should not be echoed to end users.
        raise gr.Error("Error: could not reach the EDICT endpoint") from err

    if response.status_code != 200:
        raise gr.Error("Error: " + response.text)

    return np.array(decode_image(BytesIO(response.content)))
69
+
70
# Example rows for the demo. Each row is
# [image path, original description, edit description, edit_strength, guidance_scale],
# matching the order of the interface inputs.
examples = [
    ['square_ims/american_gothic.jpg', 'A painting of two people frowning', 'A painting of two people smiling', 0.5, 3],
    ['square_ims/colloseum.jpg', 'An old ruined building', 'A new modern office building', 0.8, 3],
    ['square_ims/scream.jpg', 'A painting of someone screaming', 'A painting of an alien', 0.5, 3],
    ['square_ims/yosemite.jpg', 'Granite forest valley', 'Granite desert valley', 0.8, 3],
    ['square_ims/einstein.jpg', 'Mouth open', 'Mouth closed', 0.8, 3],
    ['square_ims/einstein.jpg', 'A man', 'A man in K.I.S.S. facepaint', 0.8, 3],
]

# Disabled cupcake examples, kept for reference (previously parked inside a
# bare triple-quoted string, which is an evaluated expression, not a comment):
# examples.extend([
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'A Chinese New Year cupcake', 0.8, 3],
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'A Union Jack cupcake', 0.8, 3],
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'A Nigerian flag cupcake', 0.8, 3],
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'A Santa Claus cupcake', 0.8, 3],
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'An Easter cupcake', 0.8, 3],
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'A hedgehog cupcake', 0.8, 3],
#     ['square_ims/imagenet_cake_2.jpg', 'A cupcake', 'A rose cupcake', 0.8, 3],
# ])

# One row per (dog image, breed) pair, dog image varying slowest.
examples.extend(
    [f'square_ims/imagenet_dog_{dog_i}.jpg', 'A dog', f'A {breed}', 0.8, 3]
    for dog_i in (1, 2)
    for breed in ('Golden Retriever', 'Chihuahua', 'Dalmatian')
)
95
+
96
+
97
# Short Markdown blurb passed to the interface as its description.
description = "A gradio demo for [EDICT](https://arxiv.org/abs/2211.12446) (CVPR23)"

# Longer Markdown usage notes passed to the interface as its article.
article = """

### Prompting Style

As with many text-to-image methods, the prompting style of EDICT can make a big difference. When in doubt, experiment! Some guidance:
* Parallel *Original Description* and *Edit Description* construction as much as possible. Inserting/editing single words often is enough to affect a change while maintaining a lot of the original structure
* Words that will affect the entire setting (e.g. "A photo of " vs. "A painting of") can make a big difference. Playing around with them can help a lot

### Parameters
Both `edit_strength` and `guidance_scale` have similar properties qualitatively: the higher the value the more the image will change. We suggest
* Increasing/decreasing `edit_strength` first, particularly to alter/preserve more of the original structure/content
* Then changing `guidance_scale` to make the change in the edited region more or less pronounced.

Usually we find changing `edit_strength` to be enough, but feel free to play around (and report any interesting results)!

### Misc.

Having difficulty coming up with a caption? Try [BLIP](https://huggingface.co/spaces/Salesforce/BLIP2) to automatically generate one!

As with most StableDiffusion approaches, faces/text are often problematic to render, especially if they're small. Having these in the foreground will help keep them cleaner.

A returned black image means that the [Safety Checker](https://huggingface.co/CompVis/stable-diffusion-safety-checker) triggered on the photo. This happens in odd cases sometimes (it often rejects
the huggingface logo or variations), but we need to keep it in for obvious reasons.
"""
125
+
126
# Input widgets in the positional order of edict's first five parameters.
# `steps` and `mix_weight` are not exposed, so edict runs with its defaults
# for those two.
demo_inputs = [
    "image",
    gr.Textbox(label="Original Description"),
    gr.Textbox(label="Edit Description"),
    gr.Slider(0.0, 1, value=0.8, step=0.05),  # edit_strength
    gr.Slider(0, 10, value=3, step=0.5),  # guidance_scale
]

# Build the demo around the remote-backed `edict` function and start it.
iface = gr.Interface(
    fn=edict,
    inputs=demo_inputs,
    examples=examples,
    outputs="image",
    description=description,
    article=article,
    cache_examples=True,
)
iface.launch()