Create utils.py
Browse files
utils.py
ADDED
@@ -0,0 +1,424 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import seaborn as sns
|
2 |
+
from PIL import Image, ImageDraw, ImageFont
|
3 |
+
import matplotlib.font_manager
|
4 |
+
import spacy
|
5 |
+
import re
|
6 |
+
import base64
|
7 |
+
import time
|
8 |
+
import re
|
9 |
+
from PIL import Image
|
10 |
+
import base64
|
11 |
+
import hashlib
|
12 |
+
import os
|
13 |
+
|
14 |
+
# Load the spaCy pipeline once at import time; text_to_dict() calls it to
# obtain noun chunks for the text preceding each [[...]] box annotation.
# NOTE(review): "en_core_web_sm-3.6.0" is presumably a local model directory
# rather than an installed package name - confirm it exists where this runs.
nlp = spacy.load("en_core_web_sm-3.6.0")
|
15 |
+
|
16 |
+
def process_image_without_resize(image_prompt):
    """Open an image and return it with a base64 encoding and a content hash.

    The image is re-saved (unchanged in size) to a timestamped temporary file
    under ``examples/``, that file is read back and base64-encoded, and the
    temporary file is then removed.

    Args:
        image_prompt: Path of the image file to open. Its extension is reused
            for the temporary file and for the returned grounding filename.

    Returns:
        A 4-tuple ``(image, encoded_img, image_hash, filename_grounding)``:
        the opened PIL image, the base64 text of the re-saved file, the
        SHA-256 hex digest of the *base64-encoded* bytes (not of the raw file
        bytes), and the path ``examples/<timestamp>_grounding<ext>``. The
        grounding path is only computed here; no file is created for it.
    """
    image = Image.open(image_prompt)
    print(f"height:{image.height}, width:{image.width}")
    timestamp = time.time()
    file_ext = os.path.splitext(image_prompt)[1]
    filename = f"examples/{timestamp}{file_ext}"
    filename_grounding = f"examples/{timestamp}_grounding{file_ext}"

    # The temporary file lives in examples/; create the directory on first use
    # instead of failing with FileNotFoundError.
    os.makedirs(os.path.dirname(filename), exist_ok=True)
    try:
        image.save(filename)
        print(f"temporal filename {filename}")
        with open(filename, "rb") as image_file:
            encoded_bytes = base64.b64encode(image_file.read())
    finally:
        # Always clean up the temporary copy, even if saving/reading failed.
        if os.path.exists(filename):
            os.remove(filename)

    encoded_img = str(encoded_bytes, encoding='utf-8')
    image_hash = hashlib.sha256(encoded_bytes).hexdigest()
    return image, encoded_img, image_hash, filename_grounding
|
31 |
+
|
32 |
+
|
33 |
+
def is_chinese(text):
    """Look for a run of characters in the range U+4E00..U+9FA5 in *text*.

    Returns the ``re.Match`` for the first such run, or ``None`` when the
    text contains none, so the result can be used directly as a truth value.
    """
    return re.search(u'[\u4e00-\u9fa5]+', text)
|
36 |
+
|
37 |
+
|
38 |
+
def draw_boxes(image, boxes, texts, output_fn='output.png'):
    """Draw labelled bounding boxes on *image* and save the result.

    Args:
        image: PIL image to annotate; it is not modified (drawing happens on a
            transparent overlay that is composited onto an RGBA copy).
        boxes: Sequence of box groups. Each group is a sequence of boxes
            ``(x0, y0, x1, y1)`` given as fractions of the image width/height.
        texts: Labels, paired with ``boxes`` by position. A falsy label means
            the rectangles of that group are drawn without text. Labels may
            contain newlines; each line is drawn on its own row.
        output_fn: Path the annotated RGB image is written to.

    Returns:
        None. The annotated image is saved to ``output_fn``.
    """
    box_width = 5
    # One distinct colour per box group.
    color_palette = sns.color_palette("husl", len(boxes))
    colors = [(int(r*255), int(g*255), int(b*255)) for r, g, b in color_palette]

    # Convert fractional coordinates to absolute pixel coordinates.
    width, height = image.size
    absolute_boxes = [[(int(box[0] * width), int(box[1] * height), int(box[2] * width), int(box[3] * height)) for box in b] for b in boxes]

    overlay = Image.new('RGBA', image.size, (255, 255, 255, 0))
    draw = ImageDraw.Draw(overlay)
    # Use the alphabetically first system TTF font; fall back to Pillow's
    # built-in font instead of raising IndexError when none is installed.
    font_paths = sorted(matplotlib.font_manager.findSystemFonts(fontpaths=None, fontext='ttf'))
    if font_paths:
        font = ImageFont.truetype(font_paths[0], size=26)
    else:
        font = ImageFont.load_default()

    # NOTE(review): labels are drawn once per rectangle of a group; confirm
    # this nesting matches the intended layout.
    for box, text, color in zip(absolute_boxes, texts, colors):
        for b in box:
            draw.rectangle(b, outline=color, width=box_width)
            if not text:
                continue
            splited_text = text.split('\n')
            num_lines = len(splited_text)
            # The last two bbox values (right, bottom) serve as text size.
            text_width, text_height = font.getbbox(splited_text[0])[-2:]
            # Default: place the label inside the box, above its bottom edge.
            y_start = b[3] - text_height * num_lines - box_width
            # Small boxes: place the label below the box instead.
            if b[2] - b[0] < 100 or b[3] - b[1] < 100:
                y_start = b[3]
            for i, line in enumerate(splited_text):
                text_width, text_height = font.getbbox(line)[-2:]
                x = b[0] + box_width
                y = y_start + text_height * i
                # Semi-transparent grey backdrop keeps the white text legible.
                draw.rectangle([x, y, x+text_width, y+text_height], fill=(128, 128, 128, 160))
                draw.text((x, y), line, font=font, fill=(255, 255, 255))
    img_with_overlay = Image.alpha_composite(image.convert('RGBA'), overlay).convert('RGB')
    img_with_overlay.save(output_fn)
|
70 |
+
|
71 |
+
def boxstr_to_boxes(box_str):
    """Parse a ``;``-separated list of boxes into lists of fractional coordinates.

    Each box is a ``,``-separated list of non-negative integers, which are
    divided by 1000. Boxes that are not made up purely of such integers
    (letters, spaces, signs, empty fields such as ``"1,,2"``) are skipped.
    The number of coordinates per box is not checked.

    Args:
        box_str: Text such as ``"100,200,300,400;10,20,30,40"``.

    Returns:
        A list with one list of floats per well-formed box.
    """
    boxes = []
    for candidate in box_str.split(';'):
        fields = candidate.split(',')
        # Validate field by field: checking the comma-stripped string as a
        # whole lets empty fields through, which then crash int().
        if all(field.isdecimal() for field in fields):
            boxes.append([int(field) / 1000 for field in fields])
    return boxes
|
74 |
+
|
75 |
+
def text_to_dict(text):
    """Map the phrase preceding each ``[[...]]`` annotation to its boxes.

    For every ``[[...]]`` group in *text*, the label is the text between the
    start of the last noun chunk that ends at or before the annotation (or
    the start of the text when there is none) and the annotation itself. If
    that label ends with ``?``, the whole text before the annotation is used
    instead.

    Args:
        text: Text containing zero or more ``[[x0,y0,x1,y1;...]]`` groups.

    Returns:
        A dict from lower-cased label to the list of boxes parsed by
        ``boxstr_to_boxes``. When the same label occurs more than once, the
        last occurrence wins.
    """
    doc = nlp(text)

    box_matches = list(re.finditer(r'\[\[([^\]]+)\]\]', text))
    if not box_matches:
        return {}

    # Noun-chunk extents do not depend on the match, so compute them once.
    chunk_spans = [(chunk.start_char, chunk.end_char) for chunk in doc.noun_chunks]

    phrase_to_boxes = {}
    for match in box_matches:
        box_position = match.start()
        nearest_np_start = max([0] + [start for start, end in chunk_spans if end <= box_position])
        noun_phrase = text[nearest_np_start:box_position].strip()
        if noun_phrase and noun_phrase[-1] == '?':
            noun_phrase = text[:box_position].strip()
        phrase_to_boxes[noun_phrase.lower()] = boxstr_to_boxes(match.group(1))
    return phrase_to_boxes
|
98 |
+
|
99 |
+
def parse_response(img, response, output_fn='output.png'):
    """Render the boxes mentioned in a model response onto a copy of *img*.

    The image is converted to RGB and scaled (keeping its aspect ratio) by
    ``min(1920 / width, 1080 / height)``, so it fits within 1920x1080; smaller
    images are scaled up. Labels and boxes are taken from
    ``text_to_dict(response)`` and drawn with ``draw_boxes``.

    Args:
        img: PIL image the response refers to.
        response: Model output text containing ``[[...]]`` box annotations.
        output_fn: Path the annotated image is written to.

    Returns:
        None. The annotated image is saved to ``output_fn``.
    """
    img = img.convert('RGB')
    width, height = img.size
    ratio = min(1920 / width, 1080 / height)
    new_width = int(width * ratio)
    new_height = int(height * ratio)
    new_img = img.resize((new_width, new_height), Image.LANCZOS)

    # Labels/boxes come solely from text_to_dict; the response is not parsed
    # a second time here.
    dic = text_to_dict(response)
    if not dic:
        texts = []
        boxes = []
    else:
        texts, boxes = zip(*dic.items())
    draw_boxes(new_img, boxes, texts, output_fn=output_fn)
|
116 |
+
|
117 |
+
def postprocess_text(template, text):
    """Insert *text* into *template*, or return it bare when no template is given.

    Args:
        template: Prompt template; every ``<TASK>`` occurrence is replaced by
            the stripped text wrapped in double quotes. An empty string means
            "no template".
        text: The user-supplied text.

    Returns:
        The filled-in, stripped template, or just the stripped text when
        *template* is the empty string.
    """
    stripped = text.strip()
    if template == "":
        return stripped
    filled = template.replace("<TASK>", f'"{stripped}"')
    return filled.strip()
|
120 |
+
|
121 |
+
|
122 |
+
# Prompt templates for the CogAgent agent mode. Every entry except the first
# contains a "<TASK>" placeholder (presumably filled in via postprocess_text).
# NOTE(review): the first entry, "do not use template", has no placeholder;
# it is presumably a sentinel the caller maps to an empty template, since
# postprocess_text only special-cases "" - confirm against the caller.
templates_agent_cogagent = [
    "do not use template",
    "Can you advise me on how to <TASK>?",
    "I'm looking for guidance on how to <TASK>.",
    "What steps do I need to take to <TASK>?",
    "Could you provide instructions for <TASK>?",
    "I'm wondering what the process is for <TASK>.",
    "How can I go about <TASK>?",
    "I need assistance with planning to <TASK>.",
    "Do you have any recommendations for <TASK>?",
    "Please share some tips for <TASK>.",
    "I'd like to know the best way to <TASK>.",
    "What's the most effective way to <TASK>?",
    "I'm seeking advice on accomplishing <TASK>.",
    "Could you guide me through the steps to <TASK>?",
    "I'm unsure how to start with <TASK>.",
    "Is there a strategy for successfully <TASK>?",
    "What's the proper procedure for <TASK>?",
    "How should I prepare for <TASK>?",
    "I'm not sure where to begin with <TASK>.",
    "I need some insights on <TASK>.",
    "Can you explain how to tackle <TASK>?",
    "I'm interested in the process of <TASK>.",
    "Could you enlighten me on <TASK>?",
    "What are the recommended steps for <TASK>?",
    "Is there a preferred method for <TASK>?",
    "I'd appreciate your advice on <TASK>.",
    "Can you shed light on <TASK>?",
    "What would be the best approach to <TASK>?",
    "How do I get started with <TASK>?",
    "I'm inquiring about the procedure for <TASK>.",
    "Could you share your expertise on <TASK>?",
    "I'd like some guidance on <TASK>.",
    "What's your recommendation for <TASK>?",
    "I'm seeking your input on how to <TASK>.",
    "Can you provide some insights into <TASK>?",
    "How can I successfully accomplish <TASK>?",
    "What steps are involved in <TASK>?",
    "I'm curious about the best way to <TASK>.",
    "Could you show me the ropes for <TASK>?",
    "I need to know how to go about <TASK>.",
    "What are the essential steps for <TASK>?",
    "Is there a specific method for <TASK>?",
    "I'd like to get some advice on <TASK>.",
    "Can you explain the process of <TASK>?",
    "I'm looking for guidance on how to approach <TASK>.",
    "What's the proper way to handle <TASK>?",
    "How should I proceed with <TASK>?",
    "I'm interested in your expertise on <TASK>.",
    "Could you walk me through the steps for <TASK>?",
    "I'm not sure where to begin when it comes to <TASK>.",
    "What should I prioritize when doing <TASK>?",
    "How can I ensure success with <TASK>?",
    "I'd appreciate some tips on <TASK>.",
    "Can you provide a roadmap for <TASK>?",
    "What's the recommended course of action for <TASK>?",
    "I'm seeking your guidance on <TASK>.",
    "Could you offer some suggestions for <TASK>?",
    "I'd like to know the steps to take for <TASK>.",
    "What's the most effective way to achieve <TASK>?",
    "How can I make the most of <TASK>?",
    "I'm wondering about the best approach to <TASK>.",
    "Can you share your insights on <TASK>?",
    "What steps should I follow to complete <TASK>?",
    "I'm looking for advice on <TASK>.",
    "What's the strategy for successfully completing <TASK>?",
    "How should I prepare myself for <TASK>?",
    "I'm not sure where to start with <TASK>.",
    "What's the procedure for <TASK>?",
    "Could you provide some guidance on <TASK>?",
    "I'd like to get some tips on how to <TASK>.",
    "Can you explain how to tackle <TASK> step by step?",
    "I'm interested in understanding the process of <TASK>.",
    "What are the key steps to <TASK>?",
    "Is there a specific method that works for <TASK>?",
    "I'd appreciate your advice on successfully completing <TASK>.",
    "Can you shed light on the best way to <TASK>?",
    "What would you recommend as the first step to <TASK>?",
    "How do I initiate <TASK>?",
    "I'm inquiring about the recommended steps for <TASK>.",
    "Could you share some insights into <TASK>?",
    "I'm seeking your expertise on <TASK>.",
    "What's your recommended approach for <TASK>?",
    "I'd like some guidance on where to start with <TASK>.",
    "Can you provide recommendations for <TASK>?",
    "What's your advice for someone looking to <TASK>?",
    "I'm seeking your input on the process of <TASK>.",
    "How can I achieve success with <TASK>?",
    "What's the best way to navigate <TASK>?",
    "I'm curious about the steps required for <TASK>.",
    "Could you show me the proper way to <TASK>?",
    "I need to know the necessary steps for <TASK>.",
    "What's the most efficient method for <TASK>?",
    "I'd appreciate your guidance on <TASK>.",
    "Can you explain the steps involved in <TASK>?",
    "I'm looking for recommendations on how to approach <TASK>.",
    "What's the right way to handle <TASK>?",
    "How should I manage <TASK>?",
    "I'm interested in your insights on <TASK>.",
    "Could you provide a step-by-step guide for <TASK>?",
    "I'm not sure how to start when it comes to <TASK>.",
    "What are the key factors to consider for <TASK>?",
    "How can I ensure a successful outcome with <TASK>?",
    "I'd like some tips and tricks for <TASK>.",
    "Can you offer a roadmap for accomplishing <TASK>?",
    "What's the preferred course of action for <TASK>?",
    "I'm seeking your expert advice on <TASK>.",
    "Could you suggest some best practices for <TASK>?",
    "I'd like to understand the necessary steps to complete <TASK>.",
    "What's the most effective strategy for <TASK>?",
]
|
234 |
+
|
235 |
+
# Prompt templates for the CogVLM grounding mode. Every entry contains exactly
# one "<TASK>" placeholder. The runtime strings are kept verbatim (including
# their odd phrasings such as "in and"); only the list structure is corrected.
template_grounding_cogvlm = [
    # --- Grounding prompts: ask for the bounding boxes of <TASK>. ---
    "Where is <TASK>?",
    "Where is <TASK> in the image?",
    "Where is <TASK>? answer in [[x0,y0,x1,y1]] format.",
    "Can you point out <TASK> in the image and provide the bounding boxes of its location?",
    "Help me to locate <TASK> in and give me its bounding boxes, please.",
    "In the given, could you find and tell me the bounding boxes of <TASK>?",
    "Guide me to the location of <TASK> within the image by providing its bounding boxes.",
    "I'd like to know the exact bounding boxes of <TASK> in the photo.",
    "Would you kindly provide the bounding boxes of <TASK> located in the picture?",
    "Can you find <TASK> in and give me the bounding boxes of where it is located?",
    "I'm trying to locate <TASK> in. Can you determine its bounding boxes for me?",
    "What are the bounding boxes of <TASK> in the image?",
    "Can you disclose the position of <TASK> in the photograph by stating its bounding boxes?",
    "In, could you let me know the location of <TASK> in the form of bounding boxes?",
    "I need the bounding boxes of <TASK> in, can you please assist me with that?",
    "Where in is <TASK> located? Provide me with its bounding boxes, please.",
    "May I have the bounding boxes of <TASK>?",
    "In the photograph, could you pinpoint the location of <TASK> and tell me its bounding boxes?",
    "Can you please search and find <TASK> in, then let me know its bounding boxes?",
    "Please, point out the position of <TASK> in the image by giving its bounding boxes.",
    "What are the exact bounding boxes of <TASK> in the provided picture?",
    "Detect the location of <TASK> in and share the bounding boxes with me, please.",
    "In the picture, I'd like you to locate <TASK> and provide its coordinates.",
    "Please indicate the location of <TASK> in the photo by giving bounding boxes.",
    "Find <TASK> in and share its coordinates with me.",
    "Could you please help me find the bounding boxes of <TASK> in the image?",
    "I am looking for the position of <TASK> in. Can you provide its bounding boxes?",
    "In the image, can you locate <TASK> and let me know its coordinates?",
    "I'd appreciate if you could find and tell me the bounding boxes of <TASK>.",
    "In, I need the bounding box bounding boxes of <TASK>.",
    "Point me to the location of <TASK> in the picture by providing its bounding boxes.",
    "Could you trace <TASK> in and tell me its bounding boxes?",
    "Can you assist me in locating <TASK> in, and then provide its bounding boxes?",
    "I'm curious, what are the bounding boxes of <TASK> in the photo?",
    "Kindly share the bounding boxes of <TASK> located in the image.",
    "I would like to find <TASK> in. Can you give me its bounding boxes?",
    "Can you spot <TASK> in and disclose its bounding boxes to me?",
    "Please, reveal the location of <TASK> in the provided photograph as coordinates.",
    "Help me locate and determine the bounding boxes of <TASK>.",
    "I request the bounding boxes of <TASK> in the image.",
    "In the given, can you find <TASK> and tell me its bounding boxes?",
    "I need to know the position of <TASK> in as bounding boxes.",
    "Locate <TASK> in and provide its bounding boxes, please.",
    "Assist me in finding <TASK> in the photo and provide the bounding box bounding boxes.",
    "In, can you guide me to the location of <TASK> by providing bounding boxes?",
    "I'd like the bounding boxes of <TASK> as it appears in the image.",
    "What location does <TASK> hold in the picture? Inform me of its bounding boxes.",
    "Identify the position of <TASK> in and share its bounding boxes.",
    "I'd like to request the bounding boxes of <TASK> within the photo.",
    "How can I locate <TASK> in the image? Please provide the bounding boxes.",
    "I am interested in knowing the bounding boxes of <TASK> in the picture.",
    "Assist me in locating the position of <TASK> in the photograph and its bounding box bounding boxes.",
    # The trailing comma below matters: without it this entry is implicitly
    # concatenated with the next one into a single two-placeholder template.
    "In the image, I need to find <TASK> and know its bounding boxes. Can you please help?",
    # --- Region-description prompts: ask for a description of region <TASK>
    # (presumably a box/coordinate string - confirm against the caller). ---
    "Can you give me a description of the region <TASK> in image?",
    "In the provided image, would you mind describing the selected area <TASK>?",
    "I need details about the area <TASK> located within image.",
    "Could you please share some information on the region <TASK> in this photograph?",
    "Describe what's happening within the coordinates <TASK> of the given image.",
    "What can you tell me about the selected region <TASK> in the photo?",
    "Please, can you help me understand what's inside the region <TASK> in image?",
    "Give me a comprehensive description of the specified area <TASK> in the picture.",
    "I'm curious about the area <TASK> in the following image. Can you describe it?",
    "Please elaborate on the area with the coordinates <TASK> in the visual.",
    "In the displayed image, help me understand the region defined by <TASK>.",
    "Regarding the image, what's going on in the section <TASK>?",
    "In the given photograph, can you explain the area with coordinates <TASK>?",
    "Kindly describe what I should be seeing in the area <TASK> of image.",
    "Within the input image, what can be found in the region defined by <TASK>?",
    "Tell me what you see within the designated area <TASK> in the picture.",
    "Please detail the contents of the chosen region <TASK> in the visual input.",
    "What's inside the area <TASK> of the provided graphic?",
    "I'd like some information about the specific region <TASK> in the image.",
    "Help me understand the details within the area <TASK> in photograph.",
    "Can you break down the region <TASK> in the image for me?",
    "What is taking place within the specified area <TASK> in this capture?",
    "Care to elaborate on the targeted area <TASK> in the visual illustration?",
    "What insights can you provide about the area <TASK> in the selected picture?",
    "What does the area <TASK> within the given visual contain?",
    "Analyze and describe the region <TASK> in the included photo.",
    "Please provide details for the area marked as <TASK> in this photographic.",
    "For the image, can you assess and describe what's happening at <TASK>?",
    "Fill me in about the selected portion <TASK> within the presented image.",
    "In the image, elaborate on the details found within the section <TASK>.",
    "Please interpret and describe the area <TASK> inside the given picture.",
    "What information can you give me about the coordinates <TASK> in image?",
    "Regarding the coordinates <TASK> in image, can you provide a description?",
    "In the photo, can you delve into the details of the region <TASK>?",
    "Please provide insights on the specified area <TASK> within the graphic.",
    "Detail the chosen region <TASK> in the depicted scene.",
    "Can you discuss the entities within the region <TASK> of image?",
    "I'd appreciate a breakdown of the area <TASK> in the displayed image.",
    "What's the story in the section <TASK> of the included visual?",
    "Please enlighten me about the region <TASK> in the given photo.",
    "Offer a thorough description of the area <TASK> within the illustration.",
    "What can you share about the area <TASK> in the presented image?",
    "Help me grasp the context of the region <TASK> within image.",
    "Kindly give an overview of the section <TASK> in photo.",
    "What details can you provide about the region <TASK> in the snapshot?",
    "Can you divulge the contents of the area <TASK> within the given image?",
    "In the submitted image, please give a synopsis of the area <TASK>.",
    "In the image, please describe the bounding box <TASK>.",
    "Please describe the region <TASK> in the picture.",
    "Describe the bbox <TASK> in the provided photo.",
    "What can you tell me about the area <TASK> within the image?",
    "Could you give me a description of the rectangular region <TASK> found in?",
    "In, what elements can be found within the coordinates <TASK>?",
    "Please provide details for the area within the bounding box <TASK> in.",
    "Can you generate a description for the selected region <TASK> in the image?",
    "Kindly describe the objects or scenery in the bounding box <TASK> within.",
    "What details can you provide for the rectangle defined by the coordinates <TASK> in?",
    "In relation to the picture, please describe the content of the area marked by <TASK>.",
    "I'd like to know more about the area <TASK> in the given image. Can you describe it?",
    "Can you help me by describing the part of that lies within the bounding box <TASK>?",
    "What's happening in the section of the photo enclosed by the coordinates <TASK>?",
    "Describe the image content present in the specified rectangular area <TASK> of.",
    "Please provide information about the area within the bounding box <TASK> in the picture.",
    "Could you offer a description of the contents in the selected area <TASK> of the image?",
    "I'm curious about the area <TASK> in. Can you provide a description of it?",
    "What can be observed in the rectangular region <TASK> in the photograph?",
    "Please explain what is contained in the portion of defined by the box <TASK>.",
    "In the photograph, can you describe the objects or scenery enclosed by <TASK>?",
    "Can you give a brief explanation of the specified area <TASK> in the image?",
    "What does the area <TASK> look like in the context of the image?",
    "Could you please describe the contents of the bounding box <TASK> in the given image?",
    "I would like to know more about the rectangular region <TASK> within the picture. Can you describe it?",
    "Please tell me about the area <TASK> in the image. What does it contain?",
    "Help me understand what's happening in the selected bounding box <TASK> within.",
    "Can you provide a description of the area <TASK> in the image?",
    "What sort of things can be seen in the region <TASK> of the photo?",
    "Describe what can be found within the bounds of <TASK> in the image.",
    "In, can you paint a picture of the area enclosed by coordinates <TASK>?",
    "Please provide a detailed account of the area covered by the bounding box <TASK> in.",
    "Give me a vivid description of what's happening in the area <TASK> within the snapshot.",
    "In the image, what do you observe within the rectangular box defined by the coordinates <TASK>?",
    "Could you give me a breakdown of the content in the specified area <TASK> of the picture?",
    "Please elucidate the area<TASK> of the image.",
    "I'd appreciate it if you could describe the portion of that lies within the rectangle <TASK>.",
    "Can you share some insights about the rectangular region <TASK> in the image?",
    "Help me visualize the section of the photo enclosed by the bounding box <TASK>.",
    "Would you kindly provide a description for the content within the rectangular area <TASK> of?",
    "In, can you tell me more about the area specified by the bounding box <TASK>?",
    "Please describe what can be seen in the rectangular region <TASK> of the image.",
    "Can you analyze the content of the area <TASK> within the photograph?",
    "In the provided image, please explain the content within the region <TASK>.",
    "I'm interested in the selected rectangle <TASK> in. Can you tell me more about it?",
    "Explain what can be found in the bounding box <TASK> in the context of the image.",
    "Kindly share your observations about the rectangular region <TASK> within.",
    "I'd like a thorough description of the area <TASK> in the image.",
    "Could you please provide a description of the rectangular area <TASK> in?",
    "Please describe the section of the picture defined by the bbox <TASK>.",
    "Tell me more about the scenery or objects within the rectangular region <TASK> in.",
    "Would you kindly describe the content of the area enclosed by <TASK> in the image?",
    "Help me understand the objects or scenery within the bounding box <TASK> in the image.",
    "I would like to know about the section of the image enclosed by the rectangle <TASK>. Can you describe it?",
    "Describe the selected rectangular area <TASK> in the photo.",
    "Tell me about the region <TASK> of the image.",
    "I request a description of the area <TASK> in the picture.",
    "Can you elaborate on the content of the bounding box <TASK> in?",
    "Please share details about the rectangular region <TASK> within the image.",
    "What can I find in the bbox <TASK> of the provided image?",
    "In the image, could you provide a description for the coordinates <TASK>?",
    "Could you tell me more about the area <TASK> in the snapshot?",
    "Fill me in on the details of the rectangular box <TASK> within the image.",
    "What's going on in the section of contained within the bounding box <TASK>?",
    "I would like a description of the content within the bbox <TASK> in.",
    "Please enlighten me about the area <TASK> in the photograph.",
    "Can you give me a visual rundown of the area <TASK> in?",
    "Describe the visual elements within the selected area <TASK> of the image.",
    "Tell me what you see in the area <TASK> within the context of the image.",
    "Explain the content within the rectangular region <TASK> of the image.",
    "I'd like some information about the bounding box <TASK> in the photo.",
    "What is happening within the rectangle defined by coordinates <TASK> in the image?",
    "Please describe the content within the area <TASK> displayed in the image.",
    "What can be seen in the bounding box <TASK> in the context of the provided image?",
    "Share some details about the objects or environment within the bounding box <TASK> in.",
    "Please describe the area <TASK> in the image for me.",
    "Can you generate a description of the contents within the selected region <TASK> in?",
    "What objects or scenery can be found in the area <TASK> in the image?",
    "Please tell me more about the rectangular section <TASK> in the photo.",
    "Could you describe the content of the bbox <TASK> in the image?",
    "What does the selected region <TASK> in the image encompass?",
    "I am interested in the region <TASK> of the image; please describe it.",
    "Can you provide some context for the area <TASK> within the picture?",
    "Please give me some details about the rectangle <TASK> in the image.",
    "In the photo, what can you see within the region defined by the bounding box <TASK>?",
    "I would like a detailed description of the portion of enclosed by the bbox <TASK>.",
    "Please help me understand the content present within the rectangle <TASK> in.",
    "Would you mind describing the rectangular area <TASK> in the provided image?",
]
|