Nishgop committed on
Commit
18a3f68
1 Parent(s): d907bd6

Create utils.py

Browse files
Files changed (1) hide show
  1. utils.py +424 -0
utils.py ADDED
@@ -0,0 +1,424 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import seaborn as sns
2
+ from PIL import Image, ImageDraw, ImageFont
3
+ import matplotlib.font_manager
4
+ import spacy
5
+ import re
6
+ import base64
7
+ import time
8
+ import re
9
+ from PIL import Image
10
+ import base64
11
+ import hashlib
12
+ import os
13
+
14
# Module-level spaCy pipeline, loaded once at import time; text_to_dict uses
# its noun chunks to find the phrase that precedes each bounding box.
# NOTE(review): "en_core_web_sm-3.6.0" is not the usual package name
# ("en_core_web_sm"); presumably it refers to a local model directory - confirm.
nlp = spacy.load("en_core_web_sm-3.6.0")
15
+
16
def process_image_without_resize(image_prompt):
    """Load an image and return it with a base64 payload, a hash and an output path.

    The image is re-saved under ``examples/`` with a timestamp-based name,
    read back as bytes, base64-encoded, and the temporary copy is deleted.

    Args:
        image_prompt: Path of the image file to open.

    Returns:
        A tuple ``(image, encoded_img, image_hash, filename_grounding)``:
        the opened PIL image, the base64 text of the re-saved file, the
        SHA-256 hex digest of the base64-encoded bytes, and the path
        ``examples/<timestamp>_grounding<ext>`` (not created here).
    """
    image = Image.open(image_prompt)
    print(f"height:{image.height}, width:{image.width}")
    timestamp = time.time()
    file_ext = os.path.splitext(image_prompt)[1]
    filename = f"examples/{timestamp}{file_ext}"
    filename_grounding = f"examples/{timestamp}_grounding{file_ext}"

    # image.save() does not create missing directories; make sure the target
    # directory exists so a fresh checkout does not fail here.
    os.makedirs("examples", exist_ok=True)
    try:
        image.save(filename)
        print(f"temporal filename {filename}")
        with open(filename, "rb") as image_file:
            encoded_bytes = base64.b64encode(image_file.read())
    finally:
        # Always drop the temporary copy, even when saving or reading failed.
        if os.path.exists(filename):
            os.remove(filename)

    encoded_img = str(encoded_bytes, encoding='utf-8')
    # The digest is deliberately taken over the base64 bytes (not the raw file
    # bytes) so hashes stay identical to those produced by earlier versions.
    image_hash = hashlib.sha256(encoded_bytes).hexdigest()
    return image, encoded_img, image_hash, filename_grounding
31
+
32
+
33
def is_chinese(text):
    """Search *text* for a run of characters in the range U+4E00-U+9FA5.

    Returns the ``re.Match`` for the first such run, or ``None`` when the
    text contains none, so the result can be used directly as a truth value.
    """
    return re.search(u'[\u4e00-\u9fa5]+', text)
36
+
37
+
38
def _load_label_font(size=26):
    """Return a font for box labels, falling back to Pillow's built-in font.

    System TTF fonts are tried in sorted path order (the first one that loads
    wins); if none is installed or loadable, ``ImageFont.load_default()`` is
    used instead of raising.
    """
    font_paths = sorted(matplotlib.font_manager.findSystemFonts(fontpaths=None, fontext='ttf'))
    for font_path in font_paths:
        try:
            return ImageFont.truetype(font_path, size=size)
        except OSError:
            # Unreadable or corrupt font file: try the next candidate.
            continue
    return ImageFont.load_default()


def draw_boxes(image, boxes, texts, output_fn='output.png'):
    """Draw labelled bounding boxes on *image* and save the result.

    Args:
        image: PIL image to annotate (it is not modified; an overlay is
            composited onto an RGBA copy).
        boxes: One entry per label; each entry is a list of boxes
            ``(x0, y0, x1, y1)`` expressed as fractions of the image width
            and height (they are multiplied by the image size below).
        texts: Label for each entry of *boxes*; falsy labels draw only the
            rectangle. Multi-line labels are split on ``'\n'``.
        output_fn: Path the annotated RGB image is written to.
    """
    box_width = 5
    # One distinct colour per label group.
    color_palette = sns.color_palette("husl", len(boxes))
    colors = [(int(r*255), int(g*255), int(b*255)) for r, g, b in color_palette]

    width, height = image.size
    absolute_boxes = [
        [
            (int(box[0] * width), int(box[1] * height), int(box[2] * width), int(box[3] * height))
            for box in group
        ]
        for group in boxes
    ]

    overlay = Image.new('RGBA', image.size, (255, 255, 255, 0))
    draw = ImageDraw.Draw(overlay)
    font = _load_label_font(size=26)

    # NOTE(review): the nesting below (label drawn for every box of a group)
    # was reconstructed from a diff view that lost indentation - confirm.
    for group, text, color in zip(absolute_boxes, texts, colors):
        for b in group:
            draw.rectangle(b, outline=color, width=box_width)
            if not text:
                continue
            splited_text = text.split('\n')
            num_lines = len(splited_text)
            text_width, text_height = font.getbbox(splited_text[0])[-2:]
            # Place the label inside the box along its bottom edge ...
            y_start = b[3] - text_height * num_lines - box_width
            # ... unless the box is small, in which case it goes below it.
            if b[2] - b[0] < 100 or b[3] - b[1] < 100:
                y_start = b[3]
            for i, line in enumerate(splited_text):
                text_width, text_height = font.getbbox(line)[-2:]
                x = b[0] + box_width
                y = y_start + text_height * i
                # Semi-transparent grey backdrop keeps the white text legible.
                draw.rectangle([x, y, x+text_width, y+text_height], fill=(128, 128, 128, 160))
                draw.text((x, y), line, font=font, fill=(255, 255, 255))
    img_with_overlay = Image.alpha_composite(image.convert('RGBA'), overlay).convert('RGB')
    img_with_overlay.save(output_fn)
70
+
71
def boxstr_to_boxes(box_str):
    """Parse a box string such as ``"x0,y0,x1,y1;x0,y0,x1,y1"`` into floats.

    Groups are separated by ``;`` and coordinates by ``,``. Each coordinate
    is an unsigned integer that is divided by 1000. Whitespace around a
    coordinate is ignored. A group is skipped entirely (instead of raising)
    when any of its coordinates is empty or not made of ASCII digits.

    Args:
        box_str: The text found between ``[[`` and ``]]``.

    Returns:
        A list with one list of floats per well-formed group.
    """
    boxes = []
    for group in box_str.split(';'):
        parts = [part.strip() for part in group.split(',')]
        # Validate every coordinate on its own: checking the joined string
        # lets inputs like "1,,2" through, which then crash in int('').
        if not all(re.fullmatch(r'[0-9]+', part) for part in parts):
            continue
        boxes.append([int(part) / 1000 for part in parts])
    return boxes
74
+
75
def text_to_dict(text):
    """Map the phrase preceding each ``[[...]]`` box annotation to its boxes.

    For every ``[[...]]`` occurrence, the label is the text from the start
    of the closest noun chunk that ends at or before the annotation up to
    the annotation itself. If that label ends with ``?``, everything before
    the annotation is used instead. Labels are lower-cased.

    When the same label occurs more than once, its boxes are merged rather
    than letting the last occurrence overwrite the earlier ones.

    Args:
        text: Text containing zero or more ``[[...]]`` annotations.

    Returns:
        A dict mapping each label to the list of boxes produced by
        ``boxstr_to_boxes``; empty when the text has no annotation.
    """
    box_matches = list(re.finditer(r'\[\[([^\]]+)\]\]', text))
    if not box_matches:
        # Nothing to label: skip the comparatively expensive NLP pass.
        return {}

    doc = nlp(text)
    # Materialise chunk offsets once instead of re-walking them per match.
    chunk_spans = [(chunk.start_char, chunk.end_char) for chunk in doc.noun_chunks]

    phrase_to_boxes = {}
    for match in box_matches:
        box_position = match.start()
        nearest_np_start = max(
            [0] + [start for start, end in chunk_spans if end <= box_position]
        )
        noun_phrase = text[nearest_np_start:box_position].strip()
        if noun_phrase and noun_phrase[-1] == '?':
            noun_phrase = text[:box_position].strip()

        parsed_boxes = boxstr_to_boxes(match.group(1))
        phrase_to_boxes.setdefault(noun_phrase.lower(), []).extend(parsed_boxes)
    return phrase_to_boxes
98
+
99
def parse_response(img, response, output_fn='output.png'):
    """Render the boxes mentioned in a model response onto a resized image.

    The image is converted to RGB and scaled (up or down, keeping aspect
    ratio) to fit within 1920x1080, the response is parsed with
    ``text_to_dict``, and the labelled boxes are drawn and saved through
    ``draw_boxes``.

    Args:
        img: PIL image the response refers to.
        response: Model output text, possibly containing ``[[...]]`` boxes.
        output_fn: Path the annotated image is written to.
    """
    img = img.convert('RGB')
    width, height = img.size
    ratio = min(1920 / width, 1080 / height)
    # Clamp to 1 pixel so extreme aspect ratios cannot truncate to a zero side.
    new_width = max(1, int(width * ratio))
    new_height = max(1, int(height * ratio))
    new_img = img.resize((new_width, new_height), Image.LANCZOS)

    # The previous regex/int pre-parse of the boxes was discarded right away
    # but could still raise on malformed coordinates, so it has been removed;
    # text_to_dict is the single source of labels and boxes.
    dic = text_to_dict(response)
    if dic:
        texts, boxes = zip(*dic.items())
    else:
        texts, boxes = [], []
    draw_boxes(new_img, boxes, texts, output_fn=output_fn)
116
+
117
def postprocess_text(template, text):
    """Insert the stripped, double-quoted *text* into *template*.

    Every ``<TASK>`` placeholder in the template is replaced by the quoted
    text and the result is stripped. An empty template returns the stripped
    text on its own, without quotes.
    """
    task = text.strip()
    if template == "":
        return task
    filled = template.replace("<TASK>", f'"{task}"')
    return filled.strip()
120
+
121
+
122
# Prompt templates for the CogAgent agent task. Each entry except the first
# contains a <TASK> placeholder (see postprocess_text, which substitutes it).
# NOTE(review): the first entry, "do not use template", has no placeholder and
# is presumably a UI choice meaning "send the text as-is"; postprocess_text
# only bypasses templating for an empty string - confirm how callers map it.
templates_agent_cogagent = [
    "do not use template",
    "Can you advise me on how to <TASK>?",
    "I'm looking for guidance on how to <TASK>.",
    "What steps do I need to take to <TASK>?",
    "Could you provide instructions for <TASK>?",
    "I'm wondering what the process is for <TASK>.",
    "How can I go about <TASK>?",
    "I need assistance with planning to <TASK>.",
    "Do you have any recommendations for <TASK>?",
    "Please share some tips for <TASK>.",
    "I'd like to know the best way to <TASK>.",
    "What's the most effective way to <TASK>?",
    "I'm seeking advice on accomplishing <TASK>.",
    "Could you guide me through the steps to <TASK>?",
    "I'm unsure how to start with <TASK>.",
    "Is there a strategy for successfully <TASK>?",
    "What's the proper procedure for <TASK>?",
    "How should I prepare for <TASK>?",
    "I'm not sure where to begin with <TASK>.",
    "I need some insights on <TASK>.",
    "Can you explain how to tackle <TASK>?",
    "I'm interested in the process of <TASK>.",
    "Could you enlighten me on <TASK>?",
    "What are the recommended steps for <TASK>?",
    "Is there a preferred method for <TASK>?",
    "I'd appreciate your advice on <TASK>.",
    "Can you shed light on <TASK>?",
    "What would be the best approach to <TASK>?",
    "How do I get started with <TASK>?",
    "I'm inquiring about the procedure for <TASK>.",
    "Could you share your expertise on <TASK>?",
    "I'd like some guidance on <TASK>.",
    "What's your recommendation for <TASK>?",
    "I'm seeking your input on how to <TASK>.",
    "Can you provide some insights into <TASK>?",
    "How can I successfully accomplish <TASK>?",
    "What steps are involved in <TASK>?",
    "I'm curious about the best way to <TASK>.",
    "Could you show me the ropes for <TASK>?",
    "I need to know how to go about <TASK>.",
    "What are the essential steps for <TASK>?",
    "Is there a specific method for <TASK>?",
    "I'd like to get some advice on <TASK>.",
    "Can you explain the process of <TASK>?",
    "I'm looking for guidance on how to approach <TASK>.",
    "What's the proper way to handle <TASK>?",
    "How should I proceed with <TASK>?",
    "I'm interested in your expertise on <TASK>.",
    "Could you walk me through the steps for <TASK>?",
    "I'm not sure where to begin when it comes to <TASK>.",
    "What should I prioritize when doing <TASK>?",
    "How can I ensure success with <TASK>?",
    "I'd appreciate some tips on <TASK>.",
    "Can you provide a roadmap for <TASK>?",
    "What's the recommended course of action for <TASK>?",
    "I'm seeking your guidance on <TASK>.",
    "Could you offer some suggestions for <TASK>?",
    "I'd like to know the steps to take for <TASK>.",
    "What's the most effective way to achieve <TASK>?",
    "How can I make the most of <TASK>?",
    "I'm wondering about the best approach to <TASK>.",
    "Can you share your insights on <TASK>?",
    "What steps should I follow to complete <TASK>?",
    "I'm looking for advice on <TASK>.",
    "What's the strategy for successfully completing <TASK>?",
    "How should I prepare myself for <TASK>?",
    "I'm not sure where to start with <TASK>.",
    "What's the procedure for <TASK>?",
    "Could you provide some guidance on <TASK>?",
    "I'd like to get some tips on how to <TASK>.",
    "Can you explain how to tackle <TASK> step by step?",
    "I'm interested in understanding the process of <TASK>.",
    "What are the key steps to <TASK>?",
    "Is there a specific method that works for <TASK>?",
    "I'd appreciate your advice on successfully completing <TASK>.",
    "Can you shed light on the best way to <TASK>?",
    "What would you recommend as the first step to <TASK>?",
    "How do I initiate <TASK>?",
    "I'm inquiring about the recommended steps for <TASK>.",
    "Could you share some insights into <TASK>?",
    "I'm seeking your expertise on <TASK>.",
    "What's your recommended approach for <TASK>?",
    "I'd like some guidance on where to start with <TASK>.",
    "Can you provide recommendations for <TASK>?",
    "What's your advice for someone looking to <TASK>?",
    "I'm seeking your input on the process of <TASK>.",
    "How can I achieve success with <TASK>?",
    "What's the best way to navigate <TASK>?",
    "I'm curious about the steps required for <TASK>.",
    "Could you show me the proper way to <TASK>?",
    "I need to know the necessary steps for <TASK>.",
    "What's the most efficient method for <TASK>?",
    "I'd appreciate your guidance on <TASK>.",
    "Can you explain the steps involved in <TASK>?",
    "I'm looking for recommendations on how to approach <TASK>.",
    "What's the right way to handle <TASK>?",
    "How should I manage <TASK>?",
    "I'm interested in your insights on <TASK>.",
    "Could you provide a step-by-step guide for <TASK>?",
    "I'm not sure how to start when it comes to <TASK>.",
    "What are the key factors to consider for <TASK>?",
    "How can I ensure a successful outcome with <TASK>?",
    "I'd like some tips and tricks for <TASK>.",
    "Can you offer a roadmap for accomplishing <TASK>?",
    "What's the preferred course of action for <TASK>?",
    "I'm seeking your expert advice on <TASK>.",
    "Could you suggest some best practices for <TASK>?",
    "I'd like to understand the necessary steps to complete <TASK>.",
    "What's the most effective strategy for <TASK>?",
]
234
+
235
# Prompt templates for CogVLM grounding. Every entry contains one <TASK>
# placeholder. The first group asks for the bounding boxes of <TASK>; the
# second group asks for a description of the region given as <TASK>.
# A missing comma between the two groups used to fuse the last grounding
# prompt and the first description prompt into a single string with two
# placeholders; they are separate entries now.
# NOTE(review): several prompts read "in." / "in," / "of." as if an image
# placeholder had been stripped, and a few say "bounding box bounding boxes";
# the wording is left untouched because it is sent to the model - confirm
# against the upstream template list before editing.
template_grounding_cogvlm = [
    "Where is <TASK>?",
    "Where is <TASK> in the image?",
    "Where is <TASK>? answer in [[x0,y0,x1,y1]] format.",
    "Can you point out <TASK> in the image and provide the bounding boxes of its location?",
    "Help me to locate <TASK> in and give me its bounding boxes, please.",
    "In the given, could you find and tell me the bounding boxes of <TASK>?",
    "Guide me to the location of <TASK> within the image by providing its bounding boxes.",
    "I'd like to know the exact bounding boxes of <TASK> in the photo.",
    "Would you kindly provide the bounding boxes of <TASK> located in the picture?",
    "Can you find <TASK> in and give me the bounding boxes of where it is located?",
    "I'm trying to locate <TASK> in. Can you determine its bounding boxes for me?",
    "What are the bounding boxes of <TASK> in the image?",
    "Can you disclose the position of <TASK> in the photograph by stating its bounding boxes?",
    "In, could you let me know the location of <TASK> in the form of bounding boxes?",
    "I need the bounding boxes of <TASK> in, can you please assist me with that?",
    "Where in is <TASK> located? Provide me with its bounding boxes, please.",
    "May I have the bounding boxes of <TASK>?",
    "In the photograph, could you pinpoint the location of <TASK> and tell me its bounding boxes?",
    "Can you please search and find <TASK> in, then let me know its bounding boxes?",
    "Please, point out the position of <TASK> in the image by giving its bounding boxes.",
    "What are the exact bounding boxes of <TASK> in the provided picture?",
    "Detect the location of <TASK> in and share the bounding boxes with me, please.",
    "In the picture, I'd like you to locate <TASK> and provide its coordinates.",
    "Please indicate the location of <TASK> in the photo by giving bounding boxes.",
    "Find <TASK> in and share its coordinates with me.",
    "Could you please help me find the bounding boxes of <TASK> in the image?",
    "I am looking for the position of <TASK> in. Can you provide its bounding boxes?",
    "In the image, can you locate <TASK> and let me know its coordinates?",
    "I'd appreciate if you could find and tell me the bounding boxes of <TASK>.",
    "In, I need the bounding box bounding boxes of <TASK>.",
    "Point me to the location of <TASK> in the picture by providing its bounding boxes.",
    "Could you trace <TASK> in and tell me its bounding boxes?",
    "Can you assist me in locating <TASK> in, and then provide its bounding boxes?",
    "I'm curious, what are the bounding boxes of <TASK> in the photo?",
    "Kindly share the bounding boxes of <TASK> located in the image.",
    "I would like to find <TASK> in. Can you give me its bounding boxes?",
    "Can you spot <TASK> in and disclose its bounding boxes to me?",
    "Please, reveal the location of <TASK> in the provided photograph as coordinates.",
    "Help me locate and determine the bounding boxes of <TASK>.",
    "I request the bounding boxes of <TASK> in the image.",
    "In the given, can you find <TASK> and tell me its bounding boxes?",
    "I need to know the position of <TASK> in as bounding boxes.",
    "Locate <TASK> in and provide its bounding boxes, please.",
    "Assist me in finding <TASK> in the photo and provide the bounding box bounding boxes.",
    "In, can you guide me to the location of <TASK> by providing bounding boxes?",
    "I'd like the bounding boxes of <TASK> as it appears in the image.",
    "What location does <TASK> hold in the picture? Inform me of its bounding boxes.",
    "Identify the position of <TASK> in and share its bounding boxes.",
    "I'd like to request the bounding boxes of <TASK> within the photo.",
    "How can I locate <TASK> in the image? Please provide the bounding boxes.",
    "I am interested in knowing the bounding boxes of <TASK> in the picture.",
    "Assist me in locating the position of <TASK> in the photograph and its bounding box bounding boxes.",
    "In the image, I need to find <TASK> and know its bounding boxes. Can you please help?",
    "Can you give me a description of the region <TASK> in image?",
    "In the provided image, would you mind describing the selected area <TASK>?",
    "I need details about the area <TASK> located within image.",
    "Could you please share some information on the region <TASK> in this photograph?",
    "Describe what's happening within the coordinates <TASK> of the given image.",
    "What can you tell me about the selected region <TASK> in the photo?",
    "Please, can you help me understand what's inside the region <TASK> in image?",
    "Give me a comprehensive description of the specified area <TASK> in the picture.",
    "I'm curious about the area <TASK> in the following image. Can you describe it?",
    "Please elaborate on the area with the coordinates <TASK> in the visual.",
    "In the displayed image, help me understand the region defined by <TASK>.",
    "Regarding the image, what's going on in the section <TASK>?",
    "In the given photograph, can you explain the area with coordinates <TASK>?",
    "Kindly describe what I should be seeing in the area <TASK> of image.",
    "Within the input image, what can be found in the region defined by <TASK>?",
    "Tell me what you see within the designated area <TASK> in the picture.",
    "Please detail the contents of the chosen region <TASK> in the visual input.",
    "What's inside the area <TASK> of the provided graphic?",
    "I'd like some information about the specific region <TASK> in the image.",
    "Help me understand the details within the area <TASK> in photograph.",
    "Can you break down the region <TASK> in the image for me?",
    "What is taking place within the specified area <TASK> in this capture?",
    "Care to elaborate on the targeted area <TASK> in the visual illustration?",
    "What insights can you provide about the area <TASK> in the selected picture?",
    "What does the area <TASK> within the given visual contain?",
    "Analyze and describe the region <TASK> in the included photo.",
    "Please provide details for the area marked as <TASK> in this photographic.",
    "For the image, can you assess and describe what's happening at <TASK>?",
    "Fill me in about the selected portion <TASK> within the presented image.",
    "In the image, elaborate on the details found within the section <TASK>.",
    "Please interpret and describe the area <TASK> inside the given picture.",
    "What information can you give me about the coordinates <TASK> in image?",
    "Regarding the coordinates <TASK> in image, can you provide a description?",
    "In the photo, can you delve into the details of the region <TASK>?",
    "Please provide insights on the specified area <TASK> within the graphic.",
    "Detail the chosen region <TASK> in the depicted scene.",
    "Can you discuss the entities within the region <TASK> of image?",
    "I'd appreciate a breakdown of the area <TASK> in the displayed image.",
    "What's the story in the section <TASK> of the included visual?",
    "Please enlighten me about the region <TASK> in the given photo.",
    "Offer a thorough description of the area <TASK> within the illustration.",
    "What can you share about the area <TASK> in the presented image?",
    "Help me grasp the context of the region <TASK> within image.",
    "Kindly give an overview of the section <TASK> in photo.",
    "What details can you provide about the region <TASK> in the snapshot?",
    "Can you divulge the contents of the area <TASK> within the given image?",
    "In the submitted image, please give a synopsis of the area <TASK>.",
    "In the image, please describe the bounding box <TASK>.",
    "Please describe the region <TASK> in the picture.",
    "Describe the bbox <TASK> in the provided photo.",
    "What can you tell me about the area <TASK> within the image?",
    "Could you give me a description of the rectangular region <TASK> found in?",
    "In, what elements can be found within the coordinates <TASK>?",
    "Please provide details for the area within the bounding box <TASK> in.",
    "Can you generate a description for the selected region <TASK> in the image?",
    "Kindly describe the objects or scenery in the bounding box <TASK> within.",
    "What details can you provide for the rectangle defined by the coordinates <TASK> in?",
    "In relation to the picture, please describe the content of the area marked by <TASK>.",
    "I'd like to know more about the area <TASK> in the given image. Can you describe it?",
    "Can you help me by describing the part of that lies within the bounding box <TASK>?",
    "What's happening in the section of the photo enclosed by the coordinates <TASK>?",
    "Describe the image content present in the specified rectangular area <TASK> of.",
    "Please provide information about the area within the bounding box <TASK> in the picture.",
    "Could you offer a description of the contents in the selected area <TASK> of the image?",
    "I'm curious about the area <TASK> in. Can you provide a description of it?",
    "What can be observed in the rectangular region <TASK> in the photograph?",
    "Please explain what is contained in the portion of defined by the box <TASK>.",
    "In the photograph, can you describe the objects or scenery enclosed by <TASK>?",
    "Can you give a brief explanation of the specified area <TASK> in the image?",
    "What does the area <TASK> look like in the context of the image?",
    "Could you please describe the contents of the bounding box <TASK> in the given image?",
    "I would like to know more about the rectangular region <TASK> within the picture. Can you describe it?",
    "Please tell me about the area <TASK> in the image. What does it contain?",
    "Help me understand what's happening in the selected bounding box <TASK> within.",
    "Can you provide a description of the area <TASK> in the image?",
    "What sort of things can be seen in the region <TASK> of the photo?",
    "Describe what can be found within the bounds of <TASK> in the image.",
    "In, can you paint a picture of the area enclosed by coordinates <TASK>?",
    "Please provide a detailed account of the area covered by the bounding box <TASK> in.",
    "Give me a vivid description of what's happening in the area <TASK> within the snapshot.",
    "In the image, what do you observe within the rectangular box defined by the coordinates <TASK>?",
    "Could you give me a breakdown of the content in the specified area <TASK> of the picture?",
    "Please elucidate the area<TASK> of the image.",
    "I'd appreciate it if you could describe the portion of that lies within the rectangle <TASK>.",
    "Can you share some insights about the rectangular region <TASK> in the image?",
    "Help me visualize the section of the photo enclosed by the bounding box <TASK>.",
    "Would you kindly provide a description for the content within the rectangular area <TASK> of?",
    "In, can you tell me more about the area specified by the bounding box <TASK>?",
    "Please describe what can be seen in the rectangular region <TASK> of the image.",
    "Can you analyze the content of the area <TASK> within the photograph?",
    "In the provided image, please explain the content within the region <TASK>.",
    "I'm interested in the selected rectangle <TASK> in. Can you tell me more about it?",
    "Explain what can be found in the bounding box <TASK> in the context of the image.",
    "Kindly share your observations about the rectangular region <TASK> within.",
    "I'd like a thorough description of the area <TASK> in the image.",
    "Could you please provide a description of the rectangular area <TASK> in?",
    "Please describe the section of the picture defined by the bbox <TASK>.",
    "Tell me more about the scenery or objects within the rectangular region <TASK> in.",
    "Would you kindly describe the content of the area enclosed by <TASK> in the image?",
    "Help me understand the objects or scenery within the bounding box <TASK> in the image.",
    "I would like to know about the section of the image enclosed by the rectangle <TASK>. Can you describe it?",
    "Describe the selected rectangular area <TASK> in the photo.",
    "Tell me about the region <TASK> of the image.",
    "I request a description of the area <TASK> in the picture.",
    "Can you elaborate on the content of the bounding box <TASK> in?",
    "Please share details about the rectangular region <TASK> within the image.",
    "What can I find in the bbox <TASK> of the provided image?",
    "In the image, could you provide a description for the coordinates <TASK>?",
    "Could you tell me more about the area <TASK> in the snapshot?",
    "Fill me in on the details of the rectangular box <TASK> within the image.",
    "What's going on in the section of contained within the bounding box <TASK>?",
    "I would like a description of the content within the bbox <TASK> in.",
    "Please enlighten me about the area <TASK> in the photograph.",
    "Can you give me a visual rundown of the area <TASK> in?",
    "Describe the visual elements within the selected area <TASK> of the image.",
    "Tell me what you see in the area <TASK> within the context of the image.",
    "Explain the content within the rectangular region <TASK> of the image.",
    "I'd like some information about the bounding box <TASK> in the photo.",
    "What is happening within the rectangle defined by coordinates <TASK> in the image?",
    "Please describe the content within the area <TASK> displayed in the image.",
    "What can be seen in the bounding box <TASK> in the context of the provided image?",
    "Share some details about the objects or environment within the bounding box <TASK> in.",
    "Please describe the area <TASK> in the image for me.",
    "Can you generate a description of the contents within the selected region <TASK> in?",
    "What objects or scenery can be found in the area <TASK> in the image?",
    "Please tell me more about the rectangular section <TASK> in the photo.",
    "Could you describe the content of the bbox <TASK> in the image?",
    "What does the selected region <TASK> in the image encompass?",
    "I am interested in the region <TASK> of the image; please describe it.",
    "Can you provide some context for the area <TASK> within the picture?",
    "Please give me some details about the rectangle <TASK> in the image.",
    "In the photo, what can you see within the region defined by the bounding box <TASK>?",
    "I would like a detailed description of the portion of enclosed by the bbox <TASK>.",
    "Please help me understand the content present within the rectangle <TASK> in.",
    "Would you mind describing the rectangular area <TASK> in the provided image?",
]