diff --git "a/entity_val2017.json" "b/entity_val2017.json"
new file mode 100644--- /dev/null
+++ "b/entity_val2017.json"
@@ -0,0 +1 @@
+{"annotations": [{"image_id": 139, "sentence": "In the image, a large, black, flat-screen TV with a silver frame is placed on a wooden stand, while a table is situated nearby in the living room.", "sentence_raw": "In the image, [2038814] is placed on a wooden stand, while [7238567] is situated nearby in the living room.", "phrase": [{"annotation_id": "2038814", "phrase": "a large, black, flat-screen TV with a silver frame", "phrase_raw": "[2038814]", "_start_idx": 14, "start_idx": 13, "end_idx": 64}, {"annotation_id": "7238567", "phrase": "a table", "phrase_raw": "[7238567]", "_start_idx": 100, "start_idx": 99, "end_idx": 107}]}, {"image_id": 285, "sentence": "A large brown bear sitting on the grass, looking at the camera with its thick, fluffy fur.", "sentence_raw": "[5931152] sitting on [3834981], looking at the camera with its thick, fluffy fur.", "phrase": [{"annotation_id": "5931152", "phrase": "A large brown bear", "phrase_raw": "[5931152]", "_start_idx": 0, "start_idx": 0, "end_idx": 18}, {"annotation_id": "3834981", "phrase": "the grass", "phrase_raw": "[3834981]", "_start_idx": 30, "start_idx": 29, "end_idx": 39}]}, {"image_id": 632, "sentence": "A green and white leafy potted plant sits near a cozy bed with a blue comforter, creating a relaxing atmosphere in the bedroom.", "sentence_raw": "[2701869] sits near [3286041], creating a relaxing atmosphere in the bedroom.", "phrase": [{"annotation_id": "2701869", "phrase": "A green and white leafy potted plant", "phrase_raw": "[2701869]", "_start_idx": 0, "start_idx": 0, "end_idx": 36}, {"annotation_id": "3286041", "phrase": "a cozy bed with a blue comforter", "phrase_raw": "[3286041]", "_start_idx": 47, "start_idx": 46, "end_idx": 79}]}, {"image_id": 724, "sentence": "An upside-down stop sign on a metal pole at a street corner, with trees in the background and an empty parking lot.", "sentence_raw": "[3813724] on a metal pole at a street corner, with [5600377] in the background and an empty parking lot.", "phrase": [{"annotation_id": "3813724", "phrase": "An upside-down stop sign", "phrase_raw": "[3813724]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "5600377", "phrase": "trees", "phrase_raw": "[5600377]", "_start_idx": 66, "start_idx": 65, "end_idx": 71}]}, {"image_id": 776, "sentence": "A brown teddy bear sitting with a large, fluffy teddy bear on a bed covered in a blue blanket.", "sentence_raw": "[2707318] sitting with [4217973] on [7562308].", "phrase": [{"annotation_id": "2707318", "phrase": "A brown teddy bear", "phrase_raw": "[2707318]", "_start_idx": 0, "start_idx": 0, "end_idx": 18}, {"annotation_id": "4217973", "phrase": "a large, fluffy teddy bear", "phrase_raw": "[4217973]", "_start_idx": 32, "start_idx": 31, "end_idx": 58}, {"annotation_id": "7562308", "phrase": "a bed covered in a blue blanket", "phrase_raw": "[7562308]", "_start_idx": 62, "start_idx": 61, "end_idx": 93}]}, {"image_id": 785, "sentence": "A woman in a red jacket skiing down a snow-covered slope with black and white skis.", "sentence_raw": "[3287629] skiing down [14144467] with [8684420].", "phrase": [{"annotation_id": "3287629", "phrase": "A woman in a red jacket", "phrase_raw": "[3287629]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "14144467", "phrase": "a snow-covered slope", "phrase_raw": "[14144467]", "_start_idx": 36, "start_idx": 35, "end_idx": 56}, {"annotation_id": "8684420", "phrase": "black and white skis", "phrase_raw": "[8684420]", "_start_idx": 62, "start_idx": 61, "end_idx": 82}]}, {"image_id": 802, "sentence": "A white oven with a stainless steel door sits next to a white double-door refrigerator in a small, well-organized kitchen with wooden cabinets and a wooden floor.", "sentence_raw": "[6316128] sits next to [8552830] in a small, well-organized kitchen with [2045786] and a [4607831].", "phrase": [{"annotation_id": "6316128", "phrase": "A white oven with a stainless steel door", "phrase_raw": "[6316128]", "_start_idx": 0, "start_idx": 0, "end_idx": 40}, {"annotation_id": "8552830", "phrase": "a white double-door refrigerator", "phrase_raw": "[8552830]", "_start_idx": 54, "start_idx": 53, "end_idx": 86}, {"annotation_id": "2045786", "phrase": "wooden cabinets", "phrase_raw": "[2045786]", "_start_idx": 127, "start_idx": 126, "end_idx": 142}, {"annotation_id": "4607831", "phrase": "wooden floor", "phrase_raw": "[4607831]", "_start_idx": 149, "start_idx": 148, "end_idx": 161}]}, {"image_id": 872, "sentence": "A baseball player in a green and white uniform is in the middle of a play on the playing field.", "sentence_raw": "[8620683] is in the middle of a play on [11914466].", "phrase": [{"annotation_id": "8620683", "phrase": "A baseball player in a green and white uniform", "phrase_raw": "[8620683]", "_start_idx": 0, "start_idx": 0, "end_idx": 46}, {"annotation_id": "11914466", "phrase": "the playing field", "phrase_raw": "[11914466]", "_start_idx": 77, "start_idx": 76, "end_idx": 94}]}, {"image_id": 885, "sentence": "A man in a blue and white outfit is playing tennis, holding a red and white tennis racket while a woman in a blue shirt and white hat watches the match.", "sentence_raw": "[6775400] is playing tennis, holding a [7378081] while [2696745] watches the match.", "phrase": [{"annotation_id": "6775400", "phrase": "A man in a blue and white outfit", "phrase_raw": "[6775400]", "_start_idx": 0, "start_idx": 0, "end_idx": 32}, {"annotation_id": "7378081", "phrase": "red and white tennis racket", "phrase_raw": "[7378081]", "_start_idx": 62, "start_idx": 61, "end_idx": 89}, {"annotation_id": "2696745", "phrase": "a woman in a blue shirt and white hat", "phrase_raw": "[2696745]", "_start_idx": 96, "start_idx": 95, "end_idx": 133}]}, {"image_id": 1000, "sentence": "A young boy in a red shirt and a boy in a white shirt holding a tennis racket pose with three young people in baseball caps on a tennis court.", "sentence_raw": "[3421582] and [6053739] pose with [5859200] on a tennis court.", "phrase": [{"annotation_id": "3421582", "phrase": "A young boy in a red shirt", "phrase_raw": "[3421582]", "_start_idx": 0, "start_idx": 0, "end_idx": 26}, {"annotation_id": "6053739", "phrase": "a boy in a white shirt holding a tennis racket", "phrase_raw": "[6053739]", "_start_idx": 31, "start_idx": 30, "end_idx": 77}, {"annotation_id": "5859200", "phrase": "three young people in baseball caps", "phrase_raw": "[5859200]", "_start_idx": 88, "start_idx": 87, "end_idx": 123}]}, {"image_id": 1268, "sentence": "A woman taking a picture of a white swan swimming in the water, with a bridge in the background and a pavement nearby.", "sentence_raw": "[1447707] taking a picture of [5985877] swimming in the water, with [3027511] in the background and [3288623] nearby.", "phrase": [{"annotation_id": "1447707", "phrase": "A woman", "phrase_raw": "[1447707]", "_start_idx": 0, "start_idx": 0, "end_idx": 7}, {"annotation_id": "5985877", "phrase": "a white swan", "phrase_raw": "[5985877]", "_start_idx": 28, "start_idx": 27, "end_idx": 40}, {"annotation_id": "3027511", "phrase": "a bridge", "phrase_raw": "[3027511]", "_start_idx": 69, "start_idx": 68, "end_idx": 77}, {"annotation_id": "3288623", "phrase": "a pavement", "phrase_raw": "[3288623]", "_start_idx": 100, "start_idx": 99, "end_idx": 110}]}, {"image_id": 1296, "sentence": "A woman wearing a white shirt holds a Hello Kitty cell phone in her hand, possibly taking a picture or looking at the screen.", "sentence_raw": "[2698051] wearing a white shirt holds [12168132] in her hand, possibly taking a picture or looking at the screen.", "phrase": [{"annotation_id": "2698051", "phrase": "A woman", "phrase_raw": "[2698051]", "_start_idx": 0, "start_idx": 0, "end_idx": 7}, {"annotation_id": "12168132", "phrase": "a Hello Kitty cell phone", "phrase_raw": "[12168132]", "_start_idx": 36, "start_idx": 35, "end_idx": 60}]}, {"image_id": 1353, "sentence": "A young boy in a black leather jacket is enjoying a ride at an amusement park, sitting on the red and gold train.", "sentence_raw": "[988966] is enjoying a ride at an amusement park, sitting on the [926018].", "phrase": [{"annotation_id": "988966", "phrase": "A young boy in a black leather jacket", "phrase_raw": "[988966]", "_start_idx": 0, "start_idx": 0, "end_idx": 37}, {"annotation_id": "926018", "phrase": "red and gold train", "phrase_raw": "[926018]", "_start_idx": 94, "start_idx": 93, "end_idx": 112}]}, {"image_id": 1425, "sentence": "A large, round sandwich with a combination of cream and fruit filling sits on a white plate on a wooden table, accompanied by a white bowl of sauce.", "sentence_raw": "[8092539] with a combination of cream and fruit filling sits on a white plate on [3947580], accompanied by [10461087] of sauce.", "phrase": [{"annotation_id": "8092539", "phrase": "A large, round sandwich", "phrase_raw": "[8092539]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "3947580", "phrase": "a wooden table", "phrase_raw": "[3947580]", "_start_idx": 95, "start_idx": 94, "end_idx": 109}, {"annotation_id": "10461087", "phrase": "a white bowl", "phrase_raw": "[10461087]", "_start_idx": 126, "start_idx": 125, "end_idx": 138}]}, {"image_id": 1490, "sentence": "A person in a black wetsuit stands on a surfboard in the middle of the calm ocean, under the clear sky, enjoying their time paddling.", "sentence_raw": "[2500134] stands on [13948116] in the middle of [8224125], under [14540253], enjoying their time paddling.", "phrase": [{"annotation_id": "2500134", "phrase": "A person in a black wetsuit", "phrase_raw": "[2500134]", "_start_idx": 0, "start_idx": 0, "end_idx": 27}, {"annotation_id": "13948116", "phrase": "a surfboard", "phrase_raw": "[13948116]", "_start_idx": 38, "start_idx": 37, "end_idx": 49}, {"annotation_id": "8224125", "phrase": "the calm ocean", "phrase_raw": "[8224125]", "_start_idx": 67, "start_idx": 66, "end_idx": 81}, {"annotation_id": "14540253", "phrase": "the clear sky", "phrase_raw": "[14540253]", "_start_idx": 89, "start_idx": 88, "end_idx": 102}]}, {"image_id": 1503, "sentence": "A white laptop computer sitting on a white desk, next to a desktop computer and other electronic devices.", "sentence_raw": "[10393490] sitting on [6515048], next to [entity_id] and other electronic devices.", "phrase": [{"annotation_id": "10393490", "phrase": "A white laptop computer", "phrase_raw": "[10393490]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "6515048", "phrase": "a white desk", "phrase_raw": "[6515048]", "_start_idx": 35, "start_idx": 34, "end_idx": 47}]}, {"image_id": 1532, "sentence": "A white van with a black bumper parked on the side of the busy road, under the clear sky, surrounded by tall buildings.", "sentence_raw": "[7960693] parked on the side of [9739936], under [15123877], surrounded by [6973791].", "phrase": [{"annotation_id": "7960693", "phrase": "A white van with a black bumper", "phrase_raw": "[7960693]", "_start_idx": 0, "start_idx": 0, "end_idx": 31}, {"annotation_id": "9739936", "phrase": "the busy road", "phrase_raw": "[9739936]", "_start_idx": 54, "start_idx": 53, "end_idx": 67}, {"annotation_id": "15123877", "phrase": "the clear sky", "phrase_raw": "[15123877]", "_start_idx": 75, "start_idx": 74, "end_idx": 88}, {"annotation_id": "6973791", "phrase": "tall buildings", "phrase_raw": "[6973791]", "_start_idx": 104, "start_idx": 103, "end_idx": 118}]}, {"image_id": 1584, "sentence": "A red double-decker bus drives down a bustling city street, passing by a black and white bus and numerous pedestrians.", "sentence_raw": "[4207751] drives down a bustling city street, passing by [4669509] and numerous pedestrians.", "phrase": [{"annotation_id": "4207751", "phrase": "A red double-decker bus", "phrase_raw": "[4207751]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "4669509", "phrase": "a black and white bus", "phrase_raw": "[4669509]", "_start_idx": 71, "start_idx": 70, "end_idx": 92}]}, {"image_id": 1675, "sentence": "A black and white cat comfortably curled up inside a sleek, modern laptop keyboard.", "sentence_raw": "[2172198] comfortably curled up inside [6908272].", "phrase": [{"annotation_id": "2172198", "phrase": "A black and white cat", "phrase_raw": "[2172198]", "_start_idx": 0, "start_idx": 0, "end_idx": 21}, {"annotation_id": "6908272", "phrase": "a sleek, modern laptop keyboard", "phrase_raw": "[6908272]", "_start_idx": 51, "start_idx": 50, "end_idx": 82}]}, {"image_id": 1761, "sentence": "A large airplane flying in the sky over a notable bridge with buildings in the background.", "sentence_raw": "[6971996] flying in the sky over [7499631] with [6448230] in the background.", "phrase": [{"annotation_id": "6971996", "phrase": "A large airplane", "phrase_raw": "[6971996]", "_start_idx": 0, "start_idx": 0, "end_idx": 16}, {"annotation_id": "7499631", "phrase": "a notable bridge", "phrase_raw": "[7499631]", "_start_idx": 40, "start_idx": 39, "end_idx": 56}, {"annotation_id": "6448230", "phrase": "buildings", "phrase_raw": "[6448230]", "_start_idx": 62, "start_idx": 61, "end_idx": 71}]}, {"image_id": 1818, "sentence": "A black-and-white striped zebra is grazing in a grassy field, appearing relaxed and at ease.", "sentence_raw": "[8092282] is grazing in [11644848], appearing relaxed and at ease.", "phrase": [{"annotation_id": "8092282", "phrase": "A black-and-white striped zebra", "phrase_raw": "[8092282]", "_start_idx": 0, "start_idx": 0, "end_idx": 31}, {"annotation_id": "11644848", "phrase": "a grassy field", "phrase_raw": "[11644848]", "_start_idx": 46, "start_idx": 45, "end_idx": 60}]}, {"image_id": 1993, "sentence": "In the cozy and inviting bedroom, a black wooden chair sits near a bed with a colorful, patterned bedspread, while a window lets in natural light.", "sentence_raw": "In the cozy and inviting bedroom, [2698543] sits near [6577250], while [10397096] lets in natural light.", "phrase": [{"annotation_id": "2698543", "phrase": "a black wooden chair", "phrase_raw": "[2698543]", "_start_idx": 34, "start_idx": 33, "end_idx": 54}, {"annotation_id": "6577250", "phrase": "a bed with a colorful, patterned bedspread", "phrase_raw": "[6577250]", "_start_idx": 65, "start_idx": 64, "end_idx": 107}, {"annotation_id": "10397096", "phrase": "a window", "phrase_raw": "[10397096]", "_start_idx": 115, "start_idx": 114, "end_idx": 123}]}, {"image_id": 2006, "sentence": "A large purple and white bus drives down a city street, providing public transportation services.", "sentence_raw": "[8282729] drives down [13289674], providing public transportation services.", "phrase": [{"annotation_id": "8282729", "phrase": "A large purple and white bus", "phrase_raw": "[8282729]", "_start_idx": 0, "start_idx": 0, "end_idx": 28}, {"annotation_id": "13289674", "phrase": "a city street", "phrase_raw": "[13289674]", "_start_idx": 41, "start_idx": 40, "end_idx": 54}]}, {"image_id": 2149, "sentence": "A white bowl filled with fresh green apples on a table, ready to be consumed or used in a recipe.", "sentence_raw": "[3639429] filled with [1471850] on a table, ready to be consumed or used in a recipe.", "phrase": [{"annotation_id": "3639429", "phrase": "A white bowl", "phrase_raw": "[3639429]", "_start_idx": 0, "start_idx": 0, "end_idx": 12}, {"annotation_id": "1471850", "phrase": "fresh green apples", "phrase_raw": "[1471850]", "_start_idx": 25, "start_idx": 24, "end_idx": 43}]}, {"image_id": 2153, "sentence": "A baseball player in a blue uniform squatting at home plate, holding a baseball bat and waiting for the pitch on grass field with dirt ground.", "sentence_raw": "[5784894] squatting at home plate, holding [4473413] and waiting for the pitch on [3692098] field with [5136513] ground.", "phrase": [{"annotation_id": "5784894", "phrase": "A baseball player in a blue uniform", "phrase_raw": "[5784894]", "_start_idx": 0, "start_idx": 0, "end_idx": 35}, {"annotation_id": "4473413", "phrase": "a baseball bat", "phrase_raw": "[4473413]", "_start_idx": 69, "start_idx": 68, "end_idx": 83}, {"annotation_id": "3692098", "phrase": "grass", "phrase_raw": "[3692098]", "_start_idx": 113, "start_idx": 112, "end_idx": 118}, {"annotation_id": "5136513", "phrase": "dirt", "phrase_raw": "[5136513]", "_start_idx": 130, "start_idx": 129, "end_idx": 134}]}, {"image_id": 2157, "sentence": "A clear wine glass with a rounded bowl and stem, next to another wine glass and a silver knife with a unique handle, all placed on a table covered with a red tablecloth and a variety of food items.", "sentence_raw": "[5261667] with a rounded bowl and stem, next to [4998986] and [8224410] with a unique handle, all placed on [1907568] covered with a red tablecloth and a variety of food items.", "phrase": [{"annotation_id": "5261667", "phrase": "A clear wine glass", "phrase_raw": "[5261667]", "_start_idx": 0, "start_idx": 0, "end_idx": 18}, {"annotation_id": "4998986", "phrase": "another wine glass", "phrase_raw": "[4998986]", "_start_idx": 57, "start_idx": 56, "end_idx": 75}, {"annotation_id": "8224410", "phrase": "a silver knife", "phrase_raw": "[8224410]", "_start_idx": 80, "start_idx": 79, "end_idx": 94}, {"annotation_id": "1907568", "phrase": "a table", "phrase_raw": "[1907568]", "_start_idx": 131, "start_idx": 130, "end_idx": 138}]}, {"image_id": 2261, "sentence": "A young boy wearing a black shirt rides a surfboard on a green wave in the ocean, showcasing his balance and having fun.", "sentence_raw": "[4539470] wearing a black shirt rides a surfboard on a green wave in the [9086350], showcasing his balance and having fun.", "phrase": [{"annotation_id": "4539470", "phrase": "A young boy", "phrase_raw": "[4539470]", "_start_idx": 0, "start_idx": 0, "end_idx": 11}, {"annotation_id": "9086350", "phrase": "ocean", "phrase_raw": "[9086350]", "_start_idx": 75, "start_idx": 74, "end_idx": 80}]}, {"image_id": 2299, "sentence": "In the black and white photo, a woman in a white shirt and blue cardigan holds a baby, while a young boy in a blue shirt and jeans sits on a chair, and another boy in a black jacket and knee socks sits on the ground, all smiling together.", "sentence_raw": "In the black and white photo, [11711154] holds a baby, while [5789784] sits on a chair, and [4539717] sits on the ground, all smiling together.", "phrase": [{"annotation_id": "11711154", "phrase": "a woman in a white shirt and blue cardigan", "phrase_raw": "[11711154]", "_start_idx": 30, "start_idx": 29, "end_idx": 72}, {"annotation_id": "5789784", "phrase": "a young boy in a blue shirt and jeans", "phrase_raw": "[5789784]", "_start_idx": 93, "start_idx": 92, "end_idx": 130}, {"annotation_id": "4539717", "phrase": "another boy in a black jacket and knee socks", "phrase_raw": "[4539717]", "_start_idx": 152, "start_idx": 151, "end_idx": 196}]}, {"image_id": 2431, "sentence": "A person in black attire and an elegant wine glass on a wooden table with a plate of bread and crackers, creating a casual dining atmosphere.", "sentence_raw": "[657414] and [4473415] on a wooden table with a plate of bread and crackers, creating a casual dining atmosphere.", "phrase": [{"annotation_id": "657414", "phrase": "A person in black attire", "phrase_raw": "[657414]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "4473415", "phrase": "an elegant wine glass", "phrase_raw": "[4473415]", "_start_idx": 29, "start_idx": 28, "end_idx": 50}]}, {"image_id": 2473, "sentence": "A young man in a colorful outfit performs an aerial trick on his snowboard under the blue sky, while a person in a white jacket and striped hat watches nearby among trees on the snow-covered slope.", "sentence_raw": "[9997963] performs an aerial trick on his snowboard under [11759171], while [11444648] watches nearby among [3618868] on the snow-covered slope.", "phrase": [{"annotation_id": "9997963", "phrase": "A young man in a colorful outfit", "phrase_raw": "[9997963]", "_start_idx": 0, "start_idx": 0, "end_idx": 32}, {"annotation_id": "11759171", "phrase": "the blue sky", "phrase_raw": "[11759171]", "_start_idx": 81, "start_idx": 80, "end_idx": 93}, {"annotation_id": "11444648", "phrase": "a person in a white jacket and striped hat", "phrase_raw": "[11444648]", "_start_idx": 101, "start_idx": 100, "end_idx": 143}, {"annotation_id": "3618868", "phrase": "trees", "phrase_raw": "[3618868]", "_start_idx": 165, "start_idx": 164, "end_idx": 170}]}, {"image_id": 2532, "sentence": "A woman in a green shirt and red jacket stands on skis with poles on a snowy slope under the clear blue sky.", "sentence_raw": "[3487018] stands on skis with poles on a [13815752] under the [11107403].", "phrase": [{"annotation_id": "3487018", "phrase": "A woman in a green shirt and red jacket", "phrase_raw": "[3487018]", "_start_idx": 0, "start_idx": 0, "end_idx": 39}, {"annotation_id": "13815752", "phrase": "snowy slope", "phrase_raw": "[13815752]", "_start_idx": 71, "start_idx": 70, "end_idx": 82}, {"annotation_id": "11107403", "phrase": "clear blue sky", "phrase_raw": "[11107403]", "_start_idx": 93, "start_idx": 92, "end_idx": 107}]}, {"image_id": 2587, "sentence": "A yellow banana and a chocolate-covered donut with purple frosting sit together in a plastic bag on a table.", "sentence_raw": "[4884632] and [3821416] sit together in a plastic bag on [1516330].", "phrase": [{"annotation_id": "4884632", "phrase": "A yellow banana", "phrase_raw": "[4884632]", "_start_idx": 0, "start_idx": 0, "end_idx": 15}, {"annotation_id": "3821416", "phrase": "a chocolate-covered donut with purple frosting", "phrase_raw": "[3821416]", "_start_idx": 20, "start_idx": 19, "end_idx": 66}, {"annotation_id": "1516330", "phrase": "a table", "phrase_raw": "[1516330]", "_start_idx": 100, "start_idx": 99, "end_idx": 107}]}, {"image_id": 2592, "sentence": "A sleek, silver knife rests beside a white mug with a pirate skull and crossbones design on a white dining table with a checkered tablecloth.", "sentence_raw": "[3356725] rests beside [11185060] on [8421750].", "phrase": [{"annotation_id": "3356725", "phrase": "A sleek, silver knife", "phrase_raw": "[3356725]", "_start_idx": 0, "start_idx": 0, "end_idx": 21}, {"annotation_id": "11185060", "phrase": "a white mug with a pirate skull and crossbones design", "phrase_raw": "[11185060]", "_start_idx": 35, "start_idx": 34, "end_idx": 88}, {"annotation_id": "8421750", "phrase": "a white dining table with a checkered tablecloth", "phrase_raw": "[8421750]", "_start_idx": 92, "start_idx": 91, "end_idx": 140}]}, {"image_id": 2685, "sentence": "A man in a tan jacket stands behind a wooden bar, surrounded by wine bottles and glasses, while engaging with a shelf nearby.", "sentence_raw": "[3887979] stands behind a wooden bar, surrounded by wine bottles and glasses, while engaging with [4358048] nearby.", "phrase": [{"annotation_id": "3887979", "phrase": "A man in a tan jacket", "phrase_raw": "[3887979]", "_start_idx": 0, "start_idx": 0, "end_idx": 21}, {"annotation_id": "4358048", "phrase": "a shelf", "phrase_raw": "[4358048]", "_start_idx": 110, "start_idx": 109, "end_idx": 117}]}, {"image_id": 2923, "sentence": "A grassy field with a few boats parked on the shore, and some birds walking around, under the overcast sky.", "sentence_raw": "[2974829] with a few [9664623] parked on the shore, and some [12560800] walking around, under the [12492689].", "phrase": [{"annotation_id": "2974829", "phrase": "A grassy field", "phrase_raw": "[2974829]", "_start_idx": 0, "start_idx": 0, "end_idx": 14}, {"annotation_id": "9664623", "phrase": "boats", "phrase_raw": "[9664623]", "_start_idx": 26, "start_idx": 25, "end_idx": 31}, {"annotation_id": "12560800", "phrase": "birds", "phrase_raw": "[12560800]", "_start_idx": 62, "start_idx": 61, "end_idx": 67}, {"annotation_id": "12492689", "phrase": "overcast sky", "phrase_raw": "[12492689]", "_start_idx": 94, "start_idx": 93, "end_idx": 106}]}, {"image_id": 3156, "sentence": "A man in a black shirt kneeling down in front of a white toilet, wearing gloves and working on it.", "sentence_raw": "[3487029] kneeling down in front of [10066329], wearing gloves and working on it.", "phrase": [{"annotation_id": "3487029", "phrase": "A man in a black shirt", "phrase_raw": "[3487029]", "_start_idx": 0, "start_idx": 0, "end_idx": 22}, {"annotation_id": "10066329", "phrase": "a white toilet", "phrase_raw": "[10066329]", "_start_idx": 49, "start_idx": 48, "end_idx": 63}]}, {"image_id": 3255, "sentence": "A mountainous area covered in snowy slopes with a group of people standing, leaving a trail of tracks behind them, indicating they have been skiing or snowboarding under the winter sky.", "sentence_raw": "[9668476] covered in [12696501] with a group of [1644569, 5196619, 2763048, 2105119, 1447190, 1710619] standing, leaving a trail of tracks behind them, indicating they have been skiing or snowboarding under the [10642474].", "phrase": [{"annotation_id": "9668476", "phrase": "A mountainous area", "phrase_raw": "[9668476]", "_start_idx": 0, "start_idx": 0, "end_idx": 18}, {"annotation_id": "12696501", "phrase": "snowy slopes", "phrase_raw": "[12696501]", "_start_idx": 30, "start_idx": 29, "end_idx": 42}, {"annotation_id": "10642474", "phrase": "winter sky", "phrase_raw": "[10642474]", "_start_idx": 174, "start_idx": 173, "end_idx": 184}]}, {"image_id": 3501, "sentence": "A white bowl filled with fresh green broccoli, rice, and a hearty stew on a wooden table.", "sentence_raw": "[9872311] filled with [3633221], rice, and a hearty stew on [2957123].", "phrase": [{"annotation_id": "9872311", "phrase": "A white bowl", "phrase_raw": "[9872311]", "_start_idx": 0, "start_idx": 0, "end_idx": 12}, {"annotation_id": "3633221", "phrase": "fresh green broccoli", "phrase_raw": "[3633221]", "_start_idx": 25, "start_idx": 24, "end_idx": 45}, {"annotation_id": "2957123", "phrase": "a wooden table", "phrase_raw": "[2957123]", "_start_idx": 74, "start_idx": 73, "end_idx": 88}]}, {"image_id": 3553, "sentence": "A person wearing white and black Vans sneakers skillfully balances on a black and white checkered skateboard while performing a trick on a wooden platform in a park, surrounded by grass.", "sentence_raw": "[2829099] skillfully balances on [3686464] while performing a trick on a wooden platform in a park, surrounded by [4220517].", "phrase": [{"annotation_id": "2829099", "phrase": "A person wearing white and black Vans sneakers", "phrase_raw": "[2829099]", "_start_idx": 0, "start_idx": 0, "end_idx": 46}, {"annotation_id": "3686464", "phrase": "a black and white checkered skateboard", "phrase_raw": "[3686464]", "_start_idx": 70, "start_idx": 69, "end_idx": 108}, {"annotation_id": "4220517", "phrase": "grass", "phrase_raw": "[4220517]", "_start_idx": 180, "start_idx": 179, "end_idx": 185}]}, {"image_id": 3661, "sentence": "A ripe and yellow banana with a slightly brown spot on one end, sitting on top of a wooden table next to a blue and white cup with a red handle.", "sentence_raw": "[2782095] with a slightly brown spot on one end, sitting on top of [8299705] next to [13943454] with a red handle.", "phrase": [{"annotation_id": "2782095", "phrase": "A ripe and yellow banana", "phrase_raw": "[2782095]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "8299705", "phrase": "a wooden table", "phrase_raw": "[8299705]", "_start_idx": 82, "start_idx": 81, "end_idx": 96}, {"annotation_id": "13943454", "phrase": "a blue and white cup", "phrase_raw": "[13943454]", "_start_idx": 105, "start_idx": 104, "end_idx": 125}]}, {"image_id": 3845, "sentence": "A wooden dining table holds a delicious meal of vibrant green broccoli, large, orange carrots, chicken, and rice, with a metallic fork nearby.", "sentence_raw": "[4155031] holds a delicious meal of [1532029], [477359], [5989755], and rice, with a [6780294] nearby.", "phrase": [{"annotation_id": "4155031", "phrase": "A wooden dining table", "phrase_raw": "[4155031]", "_start_idx": 0, "start_idx": 0, "end_idx": 21}, {"annotation_id": "1532029", "phrase": "vibrant green broccoli", "phrase_raw": "[1532029]", "_start_idx": 48, "start_idx": 47, "end_idx": 70}, {"annotation_id": "477359", "phrase": "large, orange carrots", "phrase_raw": "[477359]", "_start_idx": 72, "start_idx": 71, "end_idx": 93}, {"annotation_id": "5989755", "phrase": "chicken", "phrase_raw": "[5989755]", "_start_idx": 95, "start_idx": 94, "end_idx": 102}, {"annotation_id": "6780294", "phrase": "metallic fork", "phrase_raw": "[6780294]", "_start_idx": 121, "start_idx": 120, "end_idx": 134}]}, {"image_id": 3934, "sentence": "A young girl wearing a pink and green skirt is playing a video game in front of a wooden floor in a lively living room.", "sentence_raw": "[9866396] wearing a pink and green skirt is playing a video game in front of [2763583] in a lively living room.", "phrase": [{"annotation_id": "9866396", "phrase": "A young girl", "phrase_raw": "[9866396]", "_start_idx": 0, "start_idx": 0, "end_idx": 12}, {"annotation_id": "2763583", "phrase": "a wooden floor", "phrase_raw": "[2763583]", "_start_idx": 80, "start_idx": 79, "end_idx": 94}]}, {"image_id": 4134, "sentence": "A man in a suit and tie shakes hands with another man in a suit and tie at a formal event, while a person in a black suit and tie observes nearby.", "sentence_raw": "[856087] shakes hands with [4801866] at a formal event, while [461071] observes nearby.", "phrase": [{"annotation_id": "856087", "phrase": "A man in a suit and tie", "phrase_raw": "[856087]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "4801866", "phrase": "another man in a suit and tie", "phrase_raw": "[4801866]", "_start_idx": 42, "start_idx": 41, "end_idx": 71}, {"annotation_id": "461071", "phrase": "a person in a black suit and tie", "phrase_raw": "[461071]", "_start_idx": 97, "start_idx": 96, "end_idx": 129}]}, {"image_id": 4395, "sentence": "A man in a yellow shirt and a black tie stands in front of a window, with his hand on his chest, looking at the camera.", "sentence_raw": "[9215908] and [1910308] stands in front of a window, with his hand on his chest, looking at the camera.", "phrase": [{"annotation_id": "9215908", "phrase": "A man in a yellow shirt", "phrase_raw": "[9215908]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "1910308", "phrase": "a black tie", "phrase_raw": "[1910308]", "_start_idx": 28, "start_idx": 27, "end_idx": 39}]}, {"image_id": 4495, "sentence": "In the cozy living room, a large, colorful plaid couch sits near a shelf, providing a comfortable atmosphere.", "sentence_raw": "In the cozy living room, [7752776] sits near [3020832], providing a comfortable atmosphere.", "phrase": [{"annotation_id": "7752776", "phrase": "a large, colorful plaid couch", "phrase_raw": "[7752776]", "_start_idx": 25, "start_idx": 24, "end_idx": 54}, {"annotation_id": "3020832", "phrase": "a shelf", "phrase_raw": "[3020832]", "_start_idx": 65, "start_idx": 64, "end_idx": 72}]}, {"image_id": 4765, "sentence": "A man in a yellow wetsuit skillfully rides a long, white, and blue surfboard on a wave in the ocean.", "sentence_raw": "[6516604] skillfully rides [11582145] on a wave in the ocean.", "phrase": [{"annotation_id": "6516604", "phrase": "A man in a yellow wetsuit", "phrase_raw": "[6516604]", "_start_idx": 0, "start_idx": 0, "end_idx": 25}, {"annotation_id": "11582145", "phrase": "a long, white, and blue surfboard", "phrase_raw": "[11582145]", "_start_idx": 43, "start_idx": 42, "end_idx": 76}]}, {"image_id": 4795, "sentence": "A curious black cat sitting on a desk, observing a laptop computer screen.", "sentence_raw": "[6383217] sitting on a desk, observing [10857645] screen.", "phrase": [{"annotation_id": "6383217", "phrase": "A curious black cat", "phrase_raw": "[6383217]", "_start_idx": 0, "start_idx": 0, "end_idx": 19}, {"annotation_id": "10857645", "phrase": "a laptop computer", "phrase_raw": "[10857645]", "_start_idx": 49, "start_idx": 48, "end_idx": 66}]}, {"image_id": 5001, "sentence": "A person in a striped jacket and hat stands near a man wearing glasses and a plaid shirt, holding a blue balloon, both in front of a wall during a ribbon-cutting ceremony.", "sentence_raw": "[2894634] stands near [5984609], both in front of [3223858] during a ribbon-cutting ceremony.", "phrase": [{"annotation_id": "2894634", "phrase": "A person in a striped jacket and hat", "phrase_raw": "[2894634]", "_start_idx": 0, "start_idx": 0, "end_idx": 36}, {"annotation_id": "5984609", "phrase": "a man wearing glasses and a plaid shirt, holding a blue balloon", "phrase_raw": "[5984609]", "_start_idx": 49, "start_idx": 48, "end_idx": 112}, {"annotation_id": "3223858", "phrase": "a wall", "phrase_raw": "[3223858]", "_start_idx": 131, "start_idx": 130, "end_idx": 137}]}, {"image_id": 5037, "sentence": "A white and blue bus with a pink stripe is driving down a city street, passing by a house and a building.", "sentence_raw": "[6511971] with a pink stripe is driving down [6186101], passing by [6382962] and [5527167].", "phrase": [{"annotation_id": "6511971", "phrase": "A white and blue bus", "phrase_raw": "[6511971]", "_start_idx": 0, "start_idx": 0, "end_idx": 20}, {"annotation_id": "6186101", "phrase": "a city street", "phrase_raw": "[6186101]", "_start_idx": 56, "start_idx": 55, "end_idx": 69}, {"annotation_id": "6382962", "phrase": "a house", "phrase_raw": "[6382962]", "_start_idx": 82, "start_idx": 81, "end_idx": 89}, {"annotation_id": "5527167", "phrase": "a building", "phrase_raw": "[5527167]", "_start_idx": 94, "start_idx": 93, "end_idx": 104}]}, {"image_id": 5060, "sentence": "A man sitting on the wooden floor in front of a large mirror, taking a selfie with his cell phone.", "sentence_raw": "[3884104] sitting on [4812424] in front of [5465719], taking a selfie with [1973018].", "phrase": [{"annotation_id": "3884104", "phrase": "A man", "phrase_raw": "[3884104]", "_start_idx": 0, "start_idx": 0, "end_idx": 5}, {"annotation_id": "4812424", "phrase": "the wooden floor", "phrase_raw": "[4812424]", "_start_idx": 17, "start_idx": 16, "end_idx": 33}, {"annotation_id": "5465719", "phrase": "a large mirror", "phrase_raw": "[5465719]", "_start_idx": 46, "start_idx": 45, "end_idx": 60}, {"annotation_id": "1973018", "phrase": "his cell phone", "phrase_raw": "[1973018]", "_start_idx": 83, "start_idx": 82, "end_idx": 97}]}, {"image_id": 5193, "sentence": "A young man with a beard wearing a red jacket and holding a cell phone, posing with a smiling man holding a colorful surfboard for a picture.", "sentence_raw": "[7966359] wearing a red jacket and holding a cell phone, posing with [2895929] holding [3106707] for a picture.", "phrase": [{"annotation_id": "7966359", "phrase": "A young man with a beard", "phrase_raw": "[7966359]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "2895929", "phrase": "a smiling man", "phrase_raw": "[2895929]", "_start_idx": 84, "start_idx": 83, "end_idx": 97}, {"annotation_id": "3106707", "phrase": "a colorful surfboard", "phrase_raw": "[3106707]", "_start_idx": 106, "start_idx": 105, "end_idx": 126}]}, {"image_id": 5477, "sentence": "A large yellow and white Air France airplane parked on the runway under a cloudy sky.", "sentence_raw": "[5536663] parked on [7965586] under [12366238].", "phrase": [{"annotation_id": "5536663", "phrase": "A large yellow and white Air France airplane", "phrase_raw": "[5536663]", "_start_idx": 0, "start_idx": 0, "end_idx": 44}, {"annotation_id": "7965586", "phrase": "the runway", "phrase_raw": "[7965586]", "_start_idx": 55, "start_idx": 54, "end_idx": 65}, {"annotation_id": "12366238", "phrase": "a cloudy sky", "phrase_raw": "[12366238]", "_start_idx": 72, "start_idx": 71, "end_idx": 84}]}, {"image_id": 5503, "sentence": "A person standing in front of a white toilet in a dimly lit bathroom, with their foot visible in the foreground.", "sentence_raw": "[7368816] standing in front of [7368816] in a dimly lit bathroom, with their foot visible in the foreground.", "phrase": [{"annotation_id": "7368816", "phrase": "A person", "phrase_raw": "[7368816]", "_start_idx": 0, "start_idx": 0, "end_idx": 8}, {"annotation_id": "7368816", "phrase": "a white toilet", "phrase_raw": "[7368816]", "_start_idx": 30, "start_idx": 29, "end_idx": 44}]}, {"image_id": 5529, "sentence": "A person in a blue jacket skiing down a snowy slope with deep, powdery snow surrounding them.", "sentence_raw": "[5920346] skiing down a snowy slope with [11448498] surrounding them.", "phrase": [{"annotation_id": "5920346", "phrase": "A person in a blue jacket", "phrase_raw": "[5920346]", "_start_idx": 0, "start_idx": 0, "end_idx": 25}, {"annotation_id": "11448498", "phrase": "deep, powdery snow", "phrase_raw": "[11448498]", "_start_idx": 57, "start_idx": 56, "end_idx": 75}]}, {"image_id": 5586, "sentence": "A young man in a yellow shirt and black shorts is playing tennis on a blue outdoor court, holding a tennis racket and swinging it.", "sentence_raw": "[5856347] is playing tennis on [9735544], holding [7436416] and swinging it.", "phrase": [{"annotation_id": "5856347", "phrase": "A young man in a yellow shirt and black shorts", "phrase_raw": "[5856347]", "_start_idx": 0, "start_idx": 0, "end_idx": 46}, {"annotation_id": "9735544", "phrase": "a blue outdoor court", "phrase_raw": "[9735544]", "_start_idx": 68, "start_idx": 67, "end_idx": 88}, {"annotation_id": "7436416", "phrase": "a tennis racket", "phrase_raw": "[7436416]", "_start_idx": 98, "start_idx": 97, "end_idx": 113}]}, {"image_id": 5600, "sentence": "A simple and inviting dining table is set with a white tablecloth, featuring a white plate holding a silver bowl filled with colorful vegetables and a bowl of meat.", "sentence_raw": "[1121309] is set with a white tablecloth, featuring a white plate holding [1594007] filled with colorful vegetables and a bowl of meat.", "phrase": [{"annotation_id": "1121309", "phrase": "A simple and inviting dining table", "phrase_raw": "[1121309]", "_start_idx": 0, "start_idx": 0, "end_idx": 34}, {"annotation_id": "1594007", "phrase": "a silver bowl", "phrase_raw": "[1594007]", "_start_idx": 99, "start_idx": 98, "end_idx": 112}]}, {"image_id": 5992, "sentence": "Three fluffy, woolly sheep grazing in a grassy field near a fence and a tree.", "sentence_raw": "[5459531] grazing in a [3887945] near a [8815228] and a [10660769].", "phrase": [{"annotation_id": "5459531", "phrase": "Three fluffy, woolly sheep", "phrase_raw": "[5459531]", "_start_idx": 0, "start_idx": 0, "end_idx": 26}, {"annotation_id": "3887945", "phrase": "grassy field", "phrase_raw": "[3887945]", "_start_idx": 40, "start_idx": 39, "end_idx": 52}, {"annotation_id": "8815228", "phrase": "fence", "phrase_raw": "[8815228]", "_start_idx": 60, "start_idx": 59, "end_idx": 65}, {"annotation_id": "10660769", "phrase": "tree", "phrase_raw": "[10660769]", "_start_idx": 72, "start_idx": 71, "end_idx": 76}]}, {"image_id": 6012, "sentence": "A long, yellow banana with the peel removed lies in the center, while a slightly brown-spotted banana is slightly offset to the side. Both fruits rest on a contrasting blue background.", "sentence_raw": "[2725787] with the peel removed lies in the center, while [2660764] is slightly offset to the side. Both fruits rest on a contrasting blue background.", "phrase": [{"annotation_id": "2725787", "phrase": "A long, yellow banana", "phrase_raw": "[2725787]", "_start_idx": 0, "start_idx": 0, "end_idx": 21}, {"annotation_id": "2660764", "phrase": "a slightly brown-spotted banana", "phrase_raw": "[2660764]", "_start_idx": 70, "start_idx": 69, "end_idx": 101}]}, {"image_id": 6040, "sentence": "A blue and white commuter train travels down the tracks, surrounded by trees in the city.", "sentence_raw": "[7105121] travels down the tracks, surrounded by [1186841] in the city.", "phrase": [{"annotation_id": "7105121", "phrase": "A blue and white commuter train", "phrase_raw": "[7105121]", "_start_idx": 0, "start_idx": 0, "end_idx": 31}, {"annotation_id": "1186841", "phrase": "trees", "phrase_raw": "[1186841]", "_start_idx": 71, "start_idx": 70, "end_idx": 76}]}, {"image_id": 6213, "sentence": "An open shower curtain in a clean bathroom with a large mirror on the brown wall.", "sentence_raw": "[1514056] in a clean bathroom with [5206927] on the [8627133].", "phrase": [{"annotation_id": "1514056", "phrase": "An open shower curtain", "phrase_raw": "[1514056]", "_start_idx": 0, "start_idx": 0, "end_idx": 22}, {"annotation_id": "5206927", "phrase": "a large mirror", "phrase_raw": "[5206927]", "_start_idx": 48, "start_idx": 47, "end_idx": 62}, {"annotation_id": "8627133", "phrase": "brown wall", "phrase_raw": "[8627133]", "_start_idx": 70, "start_idx": 69, "end_idx": 80}]}, {"image_id": 6460, "sentence": "A silhouette of a person skillfully riding a surfboard on a large ocean wave, showcasing their expertise in surfing.", "sentence_raw": "[1973790] skillfully riding a [8553090] on a large [9079434], showcasing their expertise in surfing.", "phrase": [{"annotation_id": "1973790", "phrase": "A silhouette of a person", "phrase_raw": "[1973790]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "8553090", "phrase": "surfboard", "phrase_raw": "[8553090]", "_start_idx": 45, "start_idx": 44, "end_idx": 54}, {"annotation_id": "9079434", "phrase": "ocean wave", "phrase_raw": "[9079434]", "_start_idx": 66, "start_idx": 65, "end_idx": 76}]}, {"image_id": 6471, "sentence": "A baseball player in a black and white uniform holding a bat next to a player in a blue shirt on the field, with the stadium in the background.", "sentence_raw": "[5986648] holding a bat next to [4404533] on the field, with [3682089] in the background.", "phrase": [{"annotation_id": "5986648", "phrase": "A baseball player in a black and white uniform", "phrase_raw": "[5986648]", "_start_idx": 0, "start_idx": 0, "end_idx": 46}, {"annotation_id": "4404533", "phrase": "a player in a blue shirt", "phrase_raw": "[4404533]", "_start_idx": 69, "start_idx": 68, "end_idx": 93}, {"annotation_id": "3682089", "phrase": "the stadium", "phrase_raw": "[3682089]", "_start_idx": 113, "start_idx": 112, "end_idx": 124}]}, {"image_id": 6614, "sentence": "A variety of fruits including a large, round, and vibrant orange arranged on a table.", "sentence_raw": "[11974326] including [15921906] arranged on a table.", "phrase": [{"annotation_id": "11974326", "phrase": "A variety of fruits", "phrase_raw": "[11974326]", "_start_idx": 0, "start_idx": 0, "end_idx": 19}, {"annotation_id": "15921906", "phrase": "a large, round, and vibrant orange", "phrase_raw": "[15921906]", "_start_idx": 30, "start_idx": 29, "end_idx": 64}]}, {"image_id": 6723, "sentence": "A busy city street with cars driving down and buildings lining the sides, featuring a tree near the sidewalk.", "sentence_raw": "[8418677] with cars driving down and buildings lining the sides, featuring [3167056] near the sidewalk.", "phrase": [{"annotation_id": "8418677", "phrase": "A busy city street", "phrase_raw": "[8418677]", "_start_idx": 0, "start_idx": 0, "end_idx": 18}, {"annotation_id": "3167056", "phrase": "a tree", "phrase_raw": "[3167056]", "_start_idx": 84, "start_idx": 83, "end_idx": 90}]}, {"image_id": 6763, "sentence": "A woman in a white shirt is sitting at a table next to a smiling man in a blue shirt, who is wearing a gold-colored tie with white and black stripes.", "sentence_raw": "[2899033] is sitting at a table next to [4609136], who is wearing [2303288].", "phrase": [{"annotation_id": "2899033", "phrase": "A woman in a white shirt", "phrase_raw": "[2899033]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "4609136", "phrase": "a smiling man in a blue shirt", "phrase_raw": "[4609136]", "_start_idx": 55, "start_idx": 54, "end_idx": 84}, {"annotation_id": "2303288", "phrase": "a gold-colored tie with white and black stripes", "phrase_raw": "[2303288]", "_start_idx": 101, "start_idx": 100, "end_idx": 148}]}, {"image_id": 6771, "sentence": "A woman in a costume talks on her cell phone, standing amidst a crowd that includes a man with a beard and a woman with long hair.", "sentence_raw": "[5333115] talks on her cell phone, standing amidst a crowd that includes [3947437] and [4868696].", "phrase": [{"annotation_id": "5333115", "phrase": "A woman in a costume", "phrase_raw": "[5333115]", "_start_idx": 0, "start_idx": 0, "end_idx": 20}, {"annotation_id": "3947437", "phrase": "a man with a beard", "phrase_raw": "[3947437]", "_start_idx": 84, "start_idx": 83, "end_idx": 102}, {"annotation_id": "4868696", "phrase": "a woman with long hair", "phrase_raw": "[4868696]", "_start_idx": 107, "start_idx": 106, "end_idx": 129}]}, {"image_id": 6818, "sentence": "In the small bathroom, there is a white toilet with a lid and a white sink. Two buckets are placed on the tiled floor, one next to the toilet and the other near the sink.", "sentence_raw": "In the [8941399], there is a [8941399] with a lid and a white sink. Two buckets are placed on the [4604215], one next to the [8941399] and the other near the sink.", "phrase": [{"annotation_id": "8941399", "phrase": "small bathroom", "phrase_raw": "[8941399]", "_start_idx": 7, "start_idx": 6, "end_idx": 21}, {"annotation_id": "8941399", "phrase": "white toilet", "phrase_raw": "[8941399]", "_start_idx": 34, "start_idx": 33, "end_idx": 46}, {"annotation_id": "4604215", "phrase": "tiled floor", "phrase_raw": "[4604215]", "_start_idx": 106, "start_idx": 105, "end_idx": 117}, {"annotation_id": "8941399", "phrase": "toilet", "phrase_raw": "[8941399]", "_start_idx": 40, "start_idx": 39, "end_idx": 46}]}, {"image_id": 6894, "sentence": "A bearded man in a tan shirt shares a heartwarming moment with a large gray elephant as they playfully interact in a field under the sky near mountains.", "sentence_raw": "[8751767] shares a heartwarming moment with [5395804] as they playfully interact in a field under [16711165] near [12694940].", "phrase": [{"annotation_id": "8751767", "phrase": "A bearded man in a tan shirt", "phrase_raw": "[8751767]", "_start_idx": 0, "start_idx": 0, "end_idx": 28}, {"annotation_id": "5395804", "phrase": "a large gray elephant", "phrase_raw": "[5395804]", "_start_idx": 63, "start_idx": 62, "end_idx": 84}, {"annotation_id": "16711165", "phrase": "the sky", "phrase_raw": "[16711165]", "_start_idx": 129, "start_idx": 128, "end_idx": 136}, {"annotation_id": "12694940", "phrase": "mountains", "phrase_raw": "[12694940]", "_start_idx": 142, "start_idx": 141, "end_idx": 151}]}, {"image_id": 6954, "sentence": "A young boy in a red shirt and a little girl in a white dress sitting on the grass with two other children in blue clothing, holding frisbees under the sky.", "sentence_raw": "[5921417] and [8620705] sitting on the grass with [6447465], holding frisbees under [16514043].", "phrase": [{"annotation_id": "5921417", "phrase": "A young boy in a red shirt", "phrase_raw": "[5921417]", "_start_idx": 0, "start_idx": 0, "end_idx": 26}, {"annotation_id": "8620705", "phrase": "a little girl in a white dress", "phrase_raw": "[8620705]", "_start_idx": 31, "start_idx": 30, "end_idx": 61}, {"annotation_id": "6447465", "phrase": "two other children in blue clothing", "phrase_raw": "[6447465]", "_start_idx": 88, "start_idx": 87, "end_idx": 123}, {"annotation_id": "16514043", "phrase": "the sky", "phrase_raw": "[16514043]", "_start_idx": 148, "start_idx": 147, "end_idx": 155}]}, {"image_id": 7088, "sentence": "A little girl holding a pink umbrella while standing on a wet sidewalk in a residential area.", "sentence_raw": "[3941741] holding [11374732] while standing on [15461348] in a residential area.", "phrase": [{"annotation_id": "3941741", "phrase": "A little girl", "phrase_raw": "[3941741]", "_start_idx": 0, "start_idx": 0, "end_idx": 13}, {"annotation_id": "11374732", "phrase": "a pink umbrella", "phrase_raw": "[11374732]", "_start_idx": 22, "start_idx": 21, "end_idx": 37}, {"annotation_id": "15461348", "phrase": "a wet sidewalk", "phrase_raw": "[15461348]", "_start_idx": 56, "start_idx": 55, "end_idx": 70}]}, {"image_id": 7108, "sentence": "A baby elephant with a brown and red hue stands in the dirt, surrounded by other elephants, while grass and sand fill the scene in a natural environment.", "sentence_raw": "[3954842] stands in the dirt, surrounded by other elephants, while [5338997] and [8360354] fill the scene in a natural environment.", "phrase": [{"annotation_id": "3954842", "phrase": "A baby elephant with a brown and red hue", "phrase_raw": "[3954842]", "_start_idx": 0, "start_idx": 0, "end_idx": 40}, {"annotation_id": "5338997", "phrase": "grass", "phrase_raw": "[5338997]", "_start_idx": 98, "start_idx": 97, "end_idx": 103}, {"annotation_id": "8360354", "phrase": "sand", "phrase_raw": "[8360354]", "_start_idx": 108, "start_idx": 107, "end_idx": 112}]}, {"image_id": 7278, "sentence": "A man in a wetsuit skillfully rides a white and blue surfboard on a wave in the ocean.", "sentence_raw": "[6973051] skillfully rides [12960199] on a wave in [8685436].", "phrase": [{"annotation_id": "6973051", "phrase": "A man in a wetsuit", "phrase_raw": "[6973051]", "_start_idx": 0, "start_idx": 0, "end_idx": 18}, {"annotation_id": "12960199", "phrase": "a white and blue surfboard", "phrase_raw": "[12960199]", "_start_idx": 36, "start_idx": 35, "end_idx": 62}, {"annotation_id": "8685436", "phrase": "the ocean", "phrase_raw": "[8685436]", "_start_idx": 76, "start_idx": 75, "end_idx": 85}]}, {"image_id": 7281, "sentence": "A large brown horse with a white face and a brown horse with a red ribbon are being ridden by a man and a woman on the sand of a beach, under the sky.", "sentence_raw": "[6777710] and [2305346] are being ridden by a man and a woman on the [8029581] of a beach, under the [14007968].", "phrase": [{"annotation_id": "6777710", "phrase": "A large brown horse with a white face", "phrase_raw": "[6777710]", "_start_idx": 0, "start_idx": 0, "end_idx": 37}, {"annotation_id": "2305346", "phrase": "a brown horse with a red ribbon", "phrase_raw": "[2305346]", "_start_idx": 42, "start_idx": 41, "end_idx": 73}, {"annotation_id": "8029581", "phrase": "sand", "phrase_raw": "[8029581]", "_start_idx": 119, "start_idx": 118, "end_idx": 123}, {"annotation_id": "14007968", "phrase": "sky", "phrase_raw": "[14007968]", "_start_idx": 146, "start_idx": 145, "end_idx": 149}]}, {"image_id": 7386, "sentence": "A silver Chevrolet pickup truck parked in the driveway alongside a vintage-looking three-wheeled motorcycle, while a small, white, and fluffy dog stands on the grass nearby.", "sentence_raw": "[4604474] parked in the driveway alongside [6252397], while [4807530] stands on [4218974] nearby.", "phrase": [{"annotation_id": "4604474", "phrase": "A silver Chevrolet pickup truck", "phrase_raw": "[4604474]", "_start_idx": 0, "start_idx": 0, "end_idx": 31}, {"annotation_id": "6252397", "phrase": "a vintage-looking three-wheeled motorcycle", "phrase_raw": "[6252397]", "_start_idx": 65, "start_idx": 64, "end_idx": 107}, {"annotation_id": "4807530", "phrase": "a small, white, and fluffy dog", "phrase_raw": "[4807530]", "_start_idx": 115, "start_idx": 114, "end_idx": 145}, {"annotation_id": "4218974", "phrase": "the grass", "phrase_raw": "[4218974]", "_start_idx": 156, "start_idx": 155, "end_idx": 165}]}, {"image_id": 7511, "sentence": "A young man in a black shirt and jeans is preparing to fly a kite on the sandy beach near the body of water, while others enjoy various activities.", "sentence_raw": "[3026996] is preparing to fly a kite on the [8227481] near the [8283727], while others enjoy various activities.", "phrase": [{"annotation_id": "3026996", "phrase": "A young man in a black shirt and jeans", "phrase_raw": "[3026996]", "_start_idx": 0, "start_idx": 0, "end_idx": 38}, {"annotation_id": "8227481", "phrase": "sandy beach", "phrase_raw": "[8227481]", "_start_idx": 73, "start_idx": 72, "end_idx": 84}, {"annotation_id": "8283727", "phrase": "body of water", "phrase_raw": "[8283727]", "_start_idx": 94, "start_idx": 93, "end_idx": 107}]}, {"image_id": 7574, "sentence": "A black microwave with a silver handle sits on the large countertop in the clean and well-organized kitchen, surrounded by cardboard and other items.", "sentence_raw": "[3226435] with a silver handle sits on the large [3161413] in the clean and well-organized [5799580], surrounded by [5533553] and other items.", "phrase": [{"annotation_id": "3226435", "phrase": "A black microwave", "phrase_raw": "[3226435]", "_start_idx": 0, "start_idx": 0, "end_idx": 17}, {"annotation_id": "3161413", "phrase": "countertop", "phrase_raw": "[3161413]", "_start_idx": 57, "start_idx": 56, "end_idx": 67}, {"annotation_id": "5799580", "phrase": "kitchen", "phrase_raw": "[5799580]", "_start_idx": 100, "start_idx": 99, "end_idx": 107}, {"annotation_id": "5533553", "phrase": "cardboard", "phrase_raw": "[5533553]", "_start_idx": 123, "start_idx": 122, "end_idx": 132}]}, {"image_id": 7784, "sentence": "A large white and red kite soars high in the blue sky, creating a visually appealing scene.", "sentence_raw": "[8881844] soars high in the [11893582], creating a visually appealing scene.", "phrase": [{"annotation_id": "8881844", "phrase": "A large white and red kite", "phrase_raw": "[8881844]", "_start_idx": 0, "start_idx": 0, "end_idx": 26}, {"annotation_id": "11893582", "phrase": "blue sky", "phrase_raw": "[11893582]", "_start_idx": 45, "start_idx": 44, "end_idx": 53}]}, {"image_id": 7795, "sentence": "A large, white, and black bed with a patterned comforter in a well-decorated bedroom, next to a window allowing natural light to enter, and a cabinet nearby.", "sentence_raw": "[8623005] with a patterned comforter in a well-decorated bedroom, next to [10464177] allowing natural light to enter, and [1580066] nearby.", "phrase": [{"annotation_id": "8623005", "phrase": "A large, white, and black bed", "phrase_raw": "[8623005]", "_start_idx": 0, "start_idx": 0, "end_idx": 29}, {"annotation_id": "10464177", "phrase": "a window", "phrase_raw": "[10464177]", "_start_idx": 94, "start_idx": 93, "end_idx": 102}, {"annotation_id": "1580066", "phrase": "a cabinet", "phrase_raw": "[1580066]", "_start_idx": 140, "start_idx": 139, "end_idx": 149}]}, {"image_id": 7816, "sentence": "A person wearing a white helmet rides a white and green motorcycle on a road surrounded by grassy area, with a crowd of people watching.", "sentence_raw": "[9276804] rides [8882303] on a road surrounded by [4753016], with a crowd of people watching.", "phrase": [{"annotation_id": "9276804", "phrase": "A person wearing a white helmet", "phrase_raw": "[9276804]", "_start_idx": 0, "start_idx": 0, "end_idx": 31}, {"annotation_id": "8882303", "phrase": "a white and green motorcycle", "phrase_raw": "[8882303]", "_start_idx": 38, "start_idx": 37, "end_idx": 66}, {"annotation_id": "4753016", "phrase": "grassy area", "phrase_raw": "[4753016]", "_start_idx": 91, "start_idx": 90, "end_idx": 102}]}, {"image_id": 7818, "sentence": "A black, sleek chair is placed near a well-set dining table with a clear glass vase of white and purple flowers as the centerpiece.", "sentence_raw": "[1250068] is placed near [7697011] with [8887465] of white and purple flowers as the centerpiece.", "phrase": [{"annotation_id": "1250068", "phrase": "A black, sleek chair", "phrase_raw": "[1250068]", "_start_idx": 0, "start_idx": 0, "end_idx": 20}, {"annotation_id": "7697011", "phrase": "a well-set dining table", "phrase_raw": "[7697011]", "_start_idx": 36, "start_idx": 35, "end_idx": 59}, {"annotation_id": "8887465", "phrase": "a clear glass vase", "phrase_raw": "[8887465]", "_start_idx": 65, "start_idx": 64, "end_idx": 83}]}, {"image_id": 7888, "sentence": "A large black and white analog clock stands tall in a field, surrounded by grass and trees under the cloudy sky.", "sentence_raw": "[11579568] stands tall in a field, surrounded by [13355979] and trees under [14540253].", "phrase": [{"annotation_id": "11579568", "phrase": "A large black and white analog clock", "phrase_raw": "[11579568]", "_start_idx": 0, "start_idx": 0, "end_idx": 36}, {"annotation_id": "13355979", "phrase": "grass", "phrase_raw": "[13355979]", "_start_idx": 75, "start_idx": 74, "end_idx": 80}, {"annotation_id": "14540253", "phrase": "the cloudy sky", "phrase_raw": "[14540253]", "_start_idx": 97, "start_idx": 96, "end_idx": 111}]}, {"image_id": 7977, "sentence": "A young man in a black shirt skillfully riding a white skateboard with black wheels on a sidewalk near a park.", "sentence_raw": "[5855070] skillfully riding [8223103] on [10790328] near a park.", "phrase": [{"annotation_id": "5855070", "phrase": "A young man in a black shirt", "phrase_raw": "[5855070]", "_start_idx": 0, "start_idx": 0, "end_idx": 28}, {"annotation_id": "8223103", "phrase": "a white skateboard with black wheels", "phrase_raw": "[8223103]", "_start_idx": 47, "start_idx": 46, "end_idx": 83}, {"annotation_id": "10790328", "phrase": "a sidewalk", "phrase_raw": "[10790328]", "_start_idx": 87, "start_idx": 86, "end_idx": 97}]}, {"image_id": 7991, "sentence": "A vibrant orange carrot and green beans on a white plate placed on a stove, ready for cooking.", "sentence_raw": "[2512052] and green beans on a [4216152] placed on a stove, ready for cooking.", "phrase": [{"annotation_id": "2512052", "phrase": "A vibrant orange carrot", "phrase_raw": "[2512052]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "4216152", "phrase": "white plate", "phrase_raw": "[4216152]", "_start_idx": 45, "start_idx": 44, "end_idx": 56}]}, {"image_id": 8021, "sentence": "A man in a suit and tie stands in front of a large screen, engaging with the audience at a conference. A person with red hair sits nearby, watching the presentation.", "sentence_raw": "[4606360] stands in front of a large screen, engaging with the audience at a conference. [920627] sits nearby, watching the presentation.", "phrase": [{"annotation_id": "4606360", "phrase": "A man in a suit and tie", "phrase_raw": "[4606360]", "_start_idx": 0, "start_idx": 0, "end_idx": 23}, {"annotation_id": "920627", "phrase": "A person with red hair", "phrase_raw": "[920627]", "_start_idx": 103, "start_idx": 102, "end_idx": 125}]}, {"image_id": 8211, "sentence": "A person in a blue shirt and a man in a blue jumpsuit sitting on a curb near a small, black motorcycle on a busy city street with various signs.", "sentence_raw": "[6575450] and [10584960] sitting on a curb near [3158845] on a busy city street with various signs.", "phrase": [{"annotation_id": "6575450", "phrase": "A person in a blue shirt", "phrase_raw": "[6575450]", "_start_idx": 0, "start_idx": 0, "end_idx": 24}, {"annotation_id": "10584960", "phrase": "a man in a blue jumpsuit", "phrase_raw": "[10584960]", "_start_idx": 29, "start_idx": 28, "end_idx": 53}, {"annotation_id": "3158845", "phrase": "a small, black motorcycle", "phrase_raw": "[3158845]", "_start_idx": 77, "start_idx": 76, "end_idx": 102}]}, {"image_id": 8277, "sentence": "A bowl filled with slightly mushy broccoli and cooked broccoli in sauce is served as a healthy meal.", "sentence_raw": "[795690] filled with [1333093] and [1072752] is served as a healthy meal.", "phrase": [{"annotation_id": "795690", "phrase": "A bowl", "phrase_raw": "[795690]", "_start_idx": 0, "start_idx": 0, "end_idx": 6}, {"annotation_id": "1333093", "phrase": "slightly mushy broccoli", "phrase_raw": "[1333093]", "_start_idx": 19, "start_idx": 18, "end_idx": 42}, {"annotation_id": "1072752", "phrase": "cooked broccoli in sauce", "phrase_raw": "[1072752]", "_start_idx": 47, "start_idx": 46, "end_idx": 71}]}, {"image_id": 8532, "sentence": "A stylish man wearing a red, patterned tie and glasses, posing in front of a building with a smile.", "sentence_raw": "[6968923] wearing [3942019] and glasses, posing in front of [7434616] with a smile.", "phrase": [{"annotation_id": "6968923", "phrase": "A stylish man", "phrase_raw": "[6968923]", "_start_idx": 0, "start_idx": 0, "end_idx": 13}, {"annotation_id": "3942019", "phrase": "a red, patterned tie", "phrase_raw": "[3942019]", "_start_idx": 22, "start_idx": 21, "end_idx": 42}, {"annotation_id": "7434616", "phrase": "a building", "phrase_raw": "[7434616]", "_start_idx": 75, "start_idx": 74, "end_idx": 85}]}, {"image_id": 8629, "sentence": "A slice of cheese pizza with mushrooms, onions, and other toppings is placed on a plate, ready to be eaten, alongside another pizza with generous toppings, both showcasing a delicious variety.", "sentence_raw": "[1266812] is placed on a plate, ready to be eaten, alongside [3113384], both showcasing a delicious variety.", "phrase": [{"annotation_id": "1266812", "phrase": "A slice of cheese pizza with mushrooms, onions, and other toppings", "phrase_raw": "[1266812]