k3tikvats
initial commit
8b4d6a8
[
{
"scene_id": "fix_classes_sample_000",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 4 objects: a bench at bottom-center (bbox: x=0.51, y=0.83, w=0.15, h=0.07); a cat at top-right (bbox: x=0.82, y=0.12, w=0.06, h=0.04); a bench at top-right (bbox: x=0.71, y=0.17, w=0.12, h=0.07); a bench at top-left (bbox: x=0.22, y=0.18, w=0.09, h=0.07).",
"objects": [
{
"id": 0,
"class_label": "bench",
"position": "bottom-center",
"bbox": [
0.5056,
0.8329,
0.1463,
0.075
]
},
{
"id": 1,
"class_label": "cat",
"position": "top-right",
"bbox": [
0.8196,
0.1155,
0.063,
0.0442
]
},
{
"id": 2,
"class_label": "bench",
"position": "top-right",
"bbox": [
0.7086,
0.1703,
0.1174,
0.0685
]
},
{
"id": 3,
"class_label": "bench",
"position": "top-left",
"bbox": [
0.2228,
0.1839,
0.0944,
0.0739
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.5056,
0.8329,
0.1463,
0.075
],
"class_label": "bench"
},
{
"id": 1,
"bbox": [
0.8196,
0.1155,
0.063,
0.0442
],
"class_label": "cat"
},
{
"id": 2,
"bbox": [
0.7086,
0.1703,
0.1174,
0.0685
],
"class_label": "bench"
},
{
"id": 3,
"bbox": [
0.2228,
0.1839,
0.0944,
0.0739
],
"class_label": "bench"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2000
},
{
"scene_id": "fix_classes_sample_001",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 6 objects: a person at top-left (bbox: x=0.24, y=0.01, w=0.04, h=0.19); a building at top-right (bbox: x=0.59, y=0.10, w=0.27, h=0.26); a car at middle-right (bbox: x=0.71, y=0.40, w=0.24, h=0.11); a traffic_light at bottom-left (bbox: x=0.13, y=0.80, w=0.04, h=0.08); a traffic_light at bottom-center (bbox: x=0.38, y=0.82, w=0.03, h=0.08); a bicycle at top-right (bbox: x=0.76, y=0.18, w=0.08, h=0.07).",
"objects": [
{
"id": 0,
"class_label": "person",
"position": "top-left",
"bbox": [
0.2387,
0.0135,
0.0435,
0.1902
]
},
{
"id": 1,
"class_label": "building",
"position": "top-right",
"bbox": [
0.5933,
0.0967,
0.274,
0.2632
]
},
{
"id": 2,
"class_label": "car",
"position": "middle-right",
"bbox": [
0.7125,
0.4008,
0.2393,
0.1105
]
},
{
"id": 3,
"class_label": "traffic_light",
"position": "bottom-left",
"bbox": [
0.1316,
0.8023,
0.0385,
0.0789
]
},
{
"id": 4,
"class_label": "traffic_light",
"position": "bottom-center",
"bbox": [
0.3783,
0.8163,
0.025,
0.0849
]
},
{
"id": 5,
"class_label": "bicycle",
"position": "top-right",
"bbox": [
0.7613,
0.1751,
0.0845,
0.0682
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.2387,
0.0135,
0.0435,
0.1902
],
"class_label": "person"
},
{
"id": 1,
"bbox": [
0.5933,
0.0967,
0.274,
0.2632
],
"class_label": "building"
},
{
"id": 2,
"bbox": [
0.7125,
0.4008,
0.2393,
0.1105
],
"class_label": "car"
},
{
"id": 3,
"bbox": [
0.1316,
0.8023,
0.0385,
0.0789
],
"class_label": "traffic_light"
},
{
"id": 4,
"bbox": [
0.3783,
0.8163,
0.025,
0.0849
],
"class_label": "traffic_light"
},
{
"id": 5,
"bbox": [
0.7613,
0.1751,
0.0845,
0.0682
],
"class_label": "bicycle"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2001
},
{
"scene_id": "fix_classes_sample_002",
"scene_type": "urban_street",
"scene_description": "A busy urban street scene with vehicles, pedestrians, and city infrastructure. The scene contains 9 objects: a building at top-center (bbox: x=0.37, y=0.00, w=0.33, h=0.42); a traffic_light at bottom-right (bbox: x=0.76, y=0.74, w=0.03, h=0.06); a building at top-left (bbox: x=0.10, y=0.04, w=0.24, h=0.44); a tree at top-left (bbox: x=0.10, y=0.07, w=0.11, h=0.35); a bench at top-left (bbox: x=0.09, y=0.12, w=0.15, h=0.07); a tree at middle-right (bbox: x=0.70, y=0.39, w=0.11, h=0.16); a bench at bottom-left (bbox: x=0.06, y=0.71, w=0.14, h=0.05); a car at bottom-right (bbox: x=0.63, y=0.68, w=0.20, h=0.14); a building at center (bbox: x=0.35, y=0.43, w=0.15, h=0.21).",
"objects": [
{
"id": 0,
"class_label": "building",
"position": "top-center",
"bbox": [
0.3665,
0.0,
0.3261,
0.4212
]
},
{
"id": 1,
"class_label": "traffic_light",
"position": "bottom-right",
"bbox": [
0.7551,
0.7411,
0.0262,
0.063
]
},
{
"id": 2,
"class_label": "building",
"position": "top-left",
"bbox": [
0.0974,
0.0377,
0.2443,
0.4365
]
},
{
"id": 3,
"class_label": "tree",
"position": "top-left",
"bbox": [
0.0957,
0.0712,
0.1108,
0.3496
]
},
{
"id": 4,
"class_label": "bench",
"position": "top-left",
"bbox": [
0.0904,
0.1155,
0.1497,
0.0736
]
},
{
"id": 5,
"class_label": "tree",
"position": "middle-right",
"bbox": [
0.7024,
0.3879,
0.1109,
0.1578
]
},
{
"id": 6,
"class_label": "bench",
"position": "bottom-left",
"bbox": [
0.0578,
0.7082,
0.1368,
0.0525
]
},
{
"id": 7,
"class_label": "car",
"position": "bottom-right",
"bbox": [
0.6299,
0.6776,
0.1987,
0.1378
]
},
{
"id": 8,
"class_label": "building",
"position": "center",
"bbox": [
0.3465,
0.4349,
0.1549,
0.2102
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.3665,
0.0,
0.3261,
0.4212
],
"class_label": "building"
},
{
"id": 1,
"bbox": [
0.7551,
0.7411,
0.0262,
0.063
],
"class_label": "traffic_light"
},
{
"id": 2,
"bbox": [
0.0974,
0.0377,
0.2443,
0.4365
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.0957,
0.0712,
0.1108,
0.3496
],
"class_label": "tree"
},
{
"id": 4,
"bbox": [
0.0904,
0.1155,
0.1497,
0.0736
],
"class_label": "bench"
},
{
"id": 5,
"bbox": [
0.7024,
0.3879,
0.1109,
0.1578
],
"class_label": "tree"
},
{
"id": 6,
"bbox": [
0.0578,
0.7082,
0.1368,
0.0525
],
"class_label": "bench"
},
{
"id": 7,
"bbox": [
0.6299,
0.6776,
0.1987,
0.1378
],
"class_label": "car"
},
{
"id": 8,
"bbox": [
0.3465,
0.4349,
0.1549,
0.2102
],
"class_label": "building"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2002
},
{
"scene_id": "fix_classes_sample_003",
"scene_type": "urban_street",
"scene_description": "A busy urban street scene with vehicles, pedestrians, and city infrastructure. The scene contains 10 objects: a bicycle at center (bbox: x=0.53, y=0.58, w=0.08, h=0.08); a truck at top-right (bbox: x=0.67, y=0.17, w=0.20, h=0.11); a tree at bottom-center (bbox: x=0.49, y=0.74, w=0.10, h=0.16); a traffic_light at bottom-left (bbox: x=0.15, y=0.85, w=0.03, h=0.08); a car at top-center (bbox: x=0.25, y=0.23, w=0.23, h=0.10); a truck at center (bbox: x=0.41, y=0.34, w=0.19, h=0.14); a car at center (bbox: x=0.28, y=0.52, w=0.17, h=0.13); a bench at bottom-left (bbox: x=0.23, y=0.77, w=0.14, h=0.07); a truck at top-center (bbox: x=0.40, y=0.15, w=0.27, h=0.15); a truck at middle-right (bbox: x=0.74, y=0.33, w=0.24, h=0.10).",
"objects": [
{
"id": 0,
"class_label": "bicycle",
"position": "center",
"bbox": [
0.5303,
0.5776,
0.0784,
0.0839
]
},
{
"id": 1,
"class_label": "truck",
"position": "top-right",
"bbox": [
0.6659,
0.1705,
0.2007,
0.1056
]
},
{
"id": 2,
"class_label": "tree",
"position": "bottom-center",
"bbox": [
0.4939,
0.7367,
0.1045,
0.1556
]
},
{
"id": 3,
"class_label": "traffic_light",
"position": "bottom-left",
"bbox": [
0.1521,
0.8461,
0.0303,
0.0802
]
},
{
"id": 4,
"class_label": "car",
"position": "top-center",
"bbox": [
0.2497,
0.2348,
0.2268,
0.0982
]
},
{
"id": 5,
"class_label": "truck",
"position": "center",
"bbox": [
0.4123,
0.3407,
0.1866,
0.1407
]
},
{
"id": 6,
"class_label": "car",
"position": "center",
"bbox": [
0.2779,
0.5163,
0.1676,
0.1326
]
},
{
"id": 7,
"class_label": "bench",
"position": "bottom-left",
"bbox": [
0.2251,
0.7722,
0.1421,
0.0708
]
},
{
"id": 8,
"class_label": "truck",
"position": "top-center",
"bbox": [
0.4049,
0.1502,
0.27,
0.1525
]
},
{
"id": 9,
"class_label": "truck",
"position": "middle-right",
"bbox": [
0.7383,
0.3254,
0.2445,
0.102
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.5303,
0.5776,
0.0784,
0.0839
],
"class_label": "bicycle"
},
{
"id": 1,
"bbox": [
0.6659,
0.1705,
0.2007,
0.1056
],
"class_label": "truck"
},
{
"id": 2,
"bbox": [
0.4939,
0.7367,
0.1045,
0.1556
],
"class_label": "tree"
},
{
"id": 3,
"bbox": [
0.1521,
0.8461,
0.0303,
0.0802
],
"class_label": "traffic_light"
},
{
"id": 4,
"bbox": [
0.2497,
0.2348,
0.2268,
0.0982
],
"class_label": "car"
},
{
"id": 5,
"bbox": [
0.4123,
0.3407,
0.1866,
0.1407
],
"class_label": "truck"
},
{
"id": 6,
"bbox": [
0.2779,
0.5163,
0.1676,
0.1326
],
"class_label": "car"
},
{
"id": 7,
"bbox": [
0.2251,
0.7722,
0.1421,
0.0708
],
"class_label": "bench"
},
{
"id": 8,
"bbox": [
0.4049,
0.1502,
0.27,
0.1525
],
"class_label": "truck"
},
{
"id": 9,
"bbox": [
0.7383,
0.3254,
0.2445,
0.102
],
"class_label": "truck"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2003
},
{
"scene_id": "fix_classes_sample_004",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 6 objects: a bicycle at middle-left (bbox: x=0.21, y=0.47, w=0.12, h=0.07); a truck at bottom-center (bbox: x=0.53, y=0.79, w=0.17, h=0.14); a building at middle-right (bbox: x=0.66, y=0.21, w=0.33, h=0.31); a building at bottom-center (bbox: x=0.47, y=0.58, w=0.26, h=0.29); a car at middle-left (bbox: x=0.14, y=0.36, w=0.12, h=0.14); a bicycle at middle-right (bbox: x=0.77, y=0.53, w=0.10, h=0.06).",
"objects": [
{
"id": 0,
"class_label": "bicycle",
"position": "middle-left",
"bbox": [
0.2066,
0.4747,
0.1165,
0.0663
]
},
{
"id": 1,
"class_label": "truck",
"position": "bottom-center",
"bbox": [
0.5315,
0.7888,
0.1738,
0.1415
]
},
{
"id": 2,
"class_label": "building",
"position": "middle-right",
"bbox": [
0.6592,
0.2137,
0.3279,
0.3078
]
},
{
"id": 3,
"class_label": "building",
"position": "bottom-center",
"bbox": [
0.4745,
0.5794,
0.2648,
0.2865
]
},
{
"id": 4,
"class_label": "car",
"position": "middle-left",
"bbox": [
0.141,
0.3616,
0.1187,
0.1422
]
},
{
"id": 5,
"class_label": "bicycle",
"position": "middle-right",
"bbox": [
0.7732,
0.5317,
0.0971,
0.0637
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.2066,
0.4747,
0.1165,
0.0663
],
"class_label": "bicycle"
},
{
"id": 1,
"bbox": [
0.5315,
0.7888,
0.1738,
0.1415
],
"class_label": "truck"
},
{
"id": 2,
"bbox": [
0.6592,
0.2137,
0.3279,
0.3078
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.4745,
0.5794,
0.2648,
0.2865
],
"class_label": "building"
},
{
"id": 4,
"bbox": [
0.141,
0.3616,
0.1187,
0.1422
],
"class_label": "car"
},
{
"id": 5,
"bbox": [
0.7732,
0.5317,
0.0971,
0.0637
],
"class_label": "bicycle"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2004
},
{
"scene_id": "fix_classes_sample_005",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 4 objects: a building at bottom-center (bbox: x=0.28, y=0.61, w=0.19, h=0.36); a bench at middle-right (bbox: x=0.67, y=0.35, w=0.11, h=0.08); a building at center (bbox: x=0.28, y=0.36, w=0.18, h=0.26); a tree at bottom-center (bbox: x=0.40, y=0.65, w=0.08, h=0.23).",
"objects": [
{
"id": 0,
"class_label": "building",
"position": "bottom-center",
"bbox": [
0.2832,
0.6082,
0.1919,
0.3621
]
},
{
"id": 1,
"class_label": "bench",
"position": "middle-right",
"bbox": [
0.6689,
0.3473,
0.108,
0.0777
]
},
{
"id": 2,
"class_label": "building",
"position": "center",
"bbox": [
0.2776,
0.363,
0.1827,
0.2616
]
},
{
"id": 3,
"class_label": "tree",
"position": "bottom-center",
"bbox": [
0.4017,
0.6483,
0.083,
0.2308
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.2832,
0.6082,
0.1919,
0.3621
],
"class_label": "building"
},
{
"id": 1,
"bbox": [
0.6689,
0.3473,
0.108,
0.0777
],
"class_label": "bench"
},
{
"id": 2,
"bbox": [
0.2776,
0.363,
0.1827,
0.2616
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.4017,
0.6483,
0.083,
0.2308
],
"class_label": "tree"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2005
},
{
"scene_id": "fix_classes_sample_006",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 9 objects: a car at top-left (bbox: x=0.04, y=0.09, w=0.15, h=0.12); a traffic_light at center (bbox: x=0.57, y=0.37, w=0.02, h=0.08); a building at top-center (bbox: x=0.36, y=0.02, w=0.19, h=0.28); a traffic_light at center (bbox: x=0.39, y=0.50, w=0.03, h=0.09); a traffic_light at middle-left (bbox: x=0.28, y=0.36, w=0.04, h=0.09); a traffic_light at bottom-right (bbox: x=0.79, y=0.84, w=0.04, h=0.06); a bicycle at bottom-center (bbox: x=0.46, y=0.68, w=0.10, h=0.06); a person at bottom-left (bbox: x=0.15, y=0.71, w=0.07, h=0.21); a bicycle at top-right (bbox: x=0.76, y=0.18, w=0.11, h=0.11).",
"objects": [
{
"id": 0,
"class_label": "car",
"position": "top-left",
"bbox": [
0.0395,
0.0896,
0.1485,
0.1193
]
},
{
"id": 1,
"class_label": "traffic_light",
"position": "center",
"bbox": [
0.5714,
0.3689,
0.0238,
0.0825
]
},
{
"id": 2,
"class_label": "building",
"position": "top-center",
"bbox": [
0.3636,
0.0172,
0.1923,
0.2794
]
},
{
"id": 3,
"class_label": "traffic_light",
"position": "center",
"bbox": [
0.388,
0.5003,
0.0281,
0.0921
]
},
{
"id": 4,
"class_label": "traffic_light",
"position": "middle-left",
"bbox": [
0.2751,
0.3626,
0.0376,
0.0865
]
},
{
"id": 5,
"class_label": "traffic_light",
"position": "bottom-right",
"bbox": [
0.7889,
0.8405,
0.0382,
0.062
]
},
{
"id": 6,
"class_label": "bicycle",
"position": "bottom-center",
"bbox": [
0.4596,
0.6833,
0.0983,
0.0632
]
},
{
"id": 7,
"class_label": "person",
"position": "bottom-left",
"bbox": [
0.1547,
0.7105,
0.0734,
0.2081
]
},
{
"id": 8,
"class_label": "bicycle",
"position": "top-right",
"bbox": [
0.7635,
0.1774,
0.109,
0.1099
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.0395,
0.0896,
0.1485,
0.1193
],
"class_label": "car"
},
{
"id": 1,
"bbox": [
0.5714,
0.3689,
0.0238,
0.0825
],
"class_label": "traffic_light"
},
{
"id": 2,
"bbox": [
0.3636,
0.0172,
0.1923,
0.2794
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.388,
0.5003,
0.0281,
0.0921
],
"class_label": "traffic_light"
},
{
"id": 4,
"bbox": [
0.2751,
0.3626,
0.0376,
0.0865
],
"class_label": "traffic_light"
},
{
"id": 5,
"bbox": [
0.7889,
0.8405,
0.0382,
0.062
],
"class_label": "traffic_light"
},
{
"id": 6,
"bbox": [
0.4596,
0.6833,
0.0983,
0.0632
],
"class_label": "bicycle"
},
{
"id": 7,
"bbox": [
0.1547,
0.7105,
0.0734,
0.2081
],
"class_label": "person"
},
{
"id": 8,
"bbox": [
0.7635,
0.1774,
0.109,
0.1099
],
"class_label": "bicycle"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2006
},
{
"scene_id": "fix_classes_sample_007",
"scene_type": "park",
"scene_description": "A peaceful park setting with trees, benches, and people walking their pets. The scene contains 4 objects: a tree at middle-right (bbox: x=0.82, y=0.42, w=0.09, h=0.29); a person at bottom-center (bbox: x=0.41, y=0.80, w=0.06, h=0.14); a bicycle at center (bbox: x=0.46, y=0.57, w=0.10, h=0.10); a cat at bottom-left (bbox: x=0.10, y=0.84, w=0.06, h=0.04).",
"objects": [
{
"id": 0,
"class_label": "tree",
"position": "middle-right",
"bbox": [
0.8209,
0.4194,
0.0916,
0.2923
]
},
{
"id": 1,
"class_label": "person",
"position": "bottom-center",
"bbox": [
0.4122,
0.7975,
0.0569,
0.1439
]
},
{
"id": 2,
"class_label": "bicycle",
"position": "center",
"bbox": [
0.4613,
0.5704,
0.101,
0.1017
]
},
{
"id": 3,
"class_label": "cat",
"position": "bottom-left",
"bbox": [
0.0974,
0.8371,
0.059,
0.0405
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.8209,
0.4194,
0.0916,
0.2923
],
"class_label": "tree"
},
{
"id": 1,
"bbox": [
0.4122,
0.7975,
0.0569,
0.1439
],
"class_label": "person"
},
{
"id": 2,
"bbox": [
0.4613,
0.5704,
0.101,
0.1017
],
"class_label": "bicycle"
},
{
"id": 3,
"bbox": [
0.0974,
0.8371,
0.059,
0.0405
],
"class_label": "cat"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2007
},
{
"scene_id": "fix_classes_sample_008",
"scene_type": "park",
"scene_description": "A peaceful park setting with trees, benches, and people walking their pets. The scene contains 8 objects: a tree at top-center (bbox: x=0.42, y=0.13, w=0.08, h=0.30); a dog at middle-right (bbox: x=0.70, y=0.54, w=0.10, h=0.06); a bench at middle-right (bbox: x=0.69, y=0.44, w=0.12, h=0.07); a bench at bottom-right (bbox: x=0.74, y=0.83, w=0.13, h=0.07); a tree at center (bbox: x=0.36, y=0.20, w=0.14, h=0.34); a bench at center (bbox: x=0.36, y=0.48, w=0.14, h=0.08); a dog at middle-right (bbox: x=0.80, y=0.33, w=0.09, h=0.06); a cat at bottom-right (bbox: x=0.69, y=0.70, w=0.07, h=0.04).",
"objects": [
{
"id": 0,
"class_label": "tree",
"position": "top-center",
"bbox": [
0.4239,
0.1326,
0.0835,
0.2997
]
},
{
"id": 1,
"class_label": "dog",
"position": "middle-right",
"bbox": [
0.6969,
0.5435,
0.095,
0.0583
]
},
{
"id": 2,
"class_label": "bench",
"position": "middle-right",
"bbox": [
0.6949,
0.4408,
0.1195,
0.0735
]
},
{
"id": 3,
"class_label": "bench",
"position": "bottom-right",
"bbox": [
0.7447,
0.8253,
0.129,
0.0687
]
},
{
"id": 4,
"class_label": "tree",
"position": "center",
"bbox": [
0.3559,
0.1987,
0.1441,
0.3361
]
},
{
"id": 5,
"class_label": "bench",
"position": "center",
"bbox": [
0.3611,
0.4825,
0.1362,
0.0758
]
},
{
"id": 6,
"class_label": "dog",
"position": "middle-right",
"bbox": [
0.7964,
0.3324,
0.0896,
0.0571
]
},
{
"id": 7,
"class_label": "cat",
"position": "bottom-right",
"bbox": [
0.6916,
0.7017,
0.0722,
0.0406
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.4239,
0.1326,
0.0835,
0.2997
],
"class_label": "tree"
},
{
"id": 1,
"bbox": [
0.6969,
0.5435,
0.095,
0.0583
],
"class_label": "dog"
},
{
"id": 2,
"bbox": [
0.6949,
0.4408,
0.1195,
0.0735
],
"class_label": "bench"
},
{
"id": 3,
"bbox": [
0.7447,
0.8253,
0.129,
0.0687
],
"class_label": "bench"
},
{
"id": 4,
"bbox": [
0.3559,
0.1987,
0.1441,
0.3361
],
"class_label": "tree"
},
{
"id": 5,
"bbox": [
0.3611,
0.4825,
0.1362,
0.0758
],
"class_label": "bench"
},
{
"id": 6,
"bbox": [
0.7964,
0.3324,
0.0896,
0.0571
],
"class_label": "dog"
},
{
"id": 7,
"bbox": [
0.6916,
0.7017,
0.0722,
0.0406
],
"class_label": "cat"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2008
},
{
"scene_id": "fix_classes_sample_009",
"scene_type": "parking_lot",
"scene_description": "A parking lot with various vehicles and some pedestrians. The scene contains 7 objects: a bicycle at top-left (bbox: x=0.21, y=0.18, w=0.10, h=0.08); a truck at middle-left (bbox: x=0.15, y=0.31, w=0.18, h=0.11); a building at top-left (bbox: x=0.17, y=0.00, w=0.25, h=0.43); a car at bottom-right (bbox: x=0.78, y=0.70, w=0.13, h=0.13); a truck at bottom-center (bbox: x=0.25, y=0.63, w=0.23, h=0.16); a truck at bottom-right (bbox: x=0.66, y=0.76, w=0.21, h=0.14); a bicycle at middle-right (bbox: x=0.69, y=0.54, w=0.10, h=0.08).",
"objects": [
{
"id": 0,
"class_label": "bicycle",
"position": "top-left",
"bbox": [
0.2117,
0.1835,
0.103,
0.0805
]
},
{
"id": 1,
"class_label": "truck",
"position": "middle-left",
"bbox": [
0.1459,
0.3111,
0.1815,
0.1132
]
},
{
"id": 2,
"class_label": "building",
"position": "top-left",
"bbox": [
0.174,
0.0,
0.2485,
0.435
]
},
{
"id": 3,
"class_label": "car",
"position": "bottom-right",
"bbox": [
0.7804,
0.6997,
0.1347,
0.1293
]
},
{
"id": 4,
"class_label": "truck",
"position": "bottom-center",
"bbox": [
0.2522,
0.6274,
0.2337,
0.1615
]
},
{
"id": 5,
"class_label": "truck",
"position": "bottom-right",
"bbox": [
0.6556,
0.7558,
0.2137,
0.1417
]
},
{
"id": 6,
"class_label": "bicycle",
"position": "middle-right",
"bbox": [
0.6948,
0.5434,
0.0959,
0.0783
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.2117,
0.1835,
0.103,
0.0805
],
"class_label": "bicycle"
},
{
"id": 1,
"bbox": [
0.1459,
0.3111,
0.1815,
0.1132
],
"class_label": "truck"
},
{
"id": 2,
"bbox": [
0.174,
0.0,
0.2485,
0.435
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.7804,
0.6997,
0.1347,
0.1293
],
"class_label": "car"
},
{
"id": 4,
"bbox": [
0.2522,
0.6274,
0.2337,
0.1615
],
"class_label": "truck"
},
{
"id": 5,
"bbox": [
0.6556,
0.7558,
0.2137,
0.1417
],
"class_label": "truck"
},
{
"id": 6,
"bbox": [
0.6948,
0.5434,
0.0959,
0.0783
],
"class_label": "bicycle"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2009
},
{
"scene_id": "fix_classes_sample_010",
"scene_type": "park",
"scene_description": "A peaceful park setting with trees, benches, and people walking their pets. The scene contains 7 objects: a tree at middle-left (bbox: x=0.21, y=0.53, w=0.12, h=0.24); a dog at middle-left (bbox: x=0.23, y=0.49, w=0.08, h=0.05); a tree at top-right (bbox: x=0.80, y=0.02, w=0.12, h=0.25); a person at center (bbox: x=0.51, y=0.56, w=0.07, h=0.13); a dog at top-right (bbox: x=0.72, y=0.09, w=0.08, h=0.06); a person at top-center (bbox: x=0.49, y=0.15, w=0.06, h=0.11); a cat at top-right (bbox: x=0.85, y=0.15, w=0.08, h=0.05).",
"objects": [
{
"id": 0,
"class_label": "tree",
"position": "middle-left",
"bbox": [
0.2105,
0.5267,
0.1244,
0.2376
]
},
{
"id": 1,
"class_label": "dog",
"position": "middle-left",
"bbox": [
0.234,
0.4853,
0.0755,
0.0498
]
},
{
"id": 2,
"class_label": "tree",
"position": "top-right",
"bbox": [
0.7951,
0.02,
0.1234,
0.2492
]
},
{
"id": 3,
"class_label": "person",
"position": "center",
"bbox": [
0.5138,
0.5605,
0.066,
0.13
]
},
{
"id": 4,
"class_label": "dog",
"position": "top-right",
"bbox": [
0.7177,
0.0884,
0.0795,
0.0552
]
},
{
"id": 5,
"class_label": "person",
"position": "top-center",
"bbox": [
0.4942,
0.1475,
0.0587,
0.1118
]
},
{
"id": 6,
"class_label": "cat",
"position": "top-right",
"bbox": [
0.8479,
0.1488,
0.0791,
0.051
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.2105,
0.5267,
0.1244,
0.2376
],
"class_label": "tree"
},
{
"id": 1,
"bbox": [
0.234,
0.4853,
0.0755,
0.0498
],
"class_label": "dog"
},
{
"id": 2,
"bbox": [
0.7951,
0.02,
0.1234,
0.2492
],
"class_label": "tree"
},
{
"id": 3,
"bbox": [
0.5138,
0.5605,
0.066,
0.13
],
"class_label": "person"
},
{
"id": 4,
"bbox": [
0.7177,
0.0884,
0.0795,
0.0552
],
"class_label": "dog"
},
{
"id": 5,
"bbox": [
0.4942,
0.1475,
0.0587,
0.1118
],
"class_label": "person"
},
{
"id": 6,
"bbox": [
0.8479,
0.1488,
0.0791,
0.051
],
"class_label": "cat"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2010
},
{
"scene_id": "fix_classes_sample_011",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 10 objects: a building at middle-left (bbox: x=0.13, y=0.43, w=0.31, h=0.24); a car at center (bbox: x=0.44, y=0.55, w=0.24, h=0.14); a truck at middle-right (bbox: x=0.69, y=0.29, w=0.21, h=0.14); a building at center (bbox: x=0.43, y=0.32, w=0.34, h=0.30); a building at bottom-right (bbox: x=0.62, y=0.64, w=0.26, h=0.36); a bicycle at top-left (bbox: x=0.21, y=0.09, w=0.10, h=0.09); a car at bottom-center (bbox: x=0.54, y=0.79, w=0.17, h=0.12); a traffic_light at bottom-left (bbox: x=0.18, y=0.80, w=0.04, h=0.08); a truck at middle-left (bbox: x=0.13, y=0.40, w=0.26, h=0.14); a building at middle-left (bbox: x=0.09, y=0.23, w=0.34, h=0.29).",
"objects": [
{
"id": 0,
"class_label": "building",
"position": "middle-left",
"bbox": [
0.1257,
0.4257,
0.3114,
0.2419
]
},
{
"id": 1,
"class_label": "car",
"position": "center",
"bbox": [
0.4392,
0.5532,
0.2361,
0.1388
]
},
{
"id": 2,
"class_label": "truck",
"position": "middle-right",
"bbox": [
0.6866,
0.2854,
0.2109,
0.1409
]
},
{
"id": 3,
"class_label": "building",
"position": "center",
"bbox": [
0.4317,
0.3189,
0.3353,
0.2953
]
},
{
"id": 4,
"class_label": "building",
"position": "bottom-right",
"bbox": [
0.6194,
0.6385,
0.255,
0.3615
]
},
{
"id": 5,
"class_label": "bicycle",
"position": "top-left",
"bbox": [
0.2083,
0.0889,
0.0952,
0.0946
]
},
{
"id": 6,
"class_label": "car",
"position": "bottom-center",
"bbox": [
0.5437,
0.7863,
0.1666,
0.1211
]
},
{
"id": 7,
"class_label": "traffic_light",
"position": "bottom-left",
"bbox": [
0.1784,
0.7972,
0.0375,
0.0809
]
},
{
"id": 8,
"class_label": "truck",
"position": "middle-left",
"bbox": [
0.1301,
0.4007,
0.2577,
0.1387
]
},
{
"id": 9,
"class_label": "building",
"position": "middle-left",
"bbox": [
0.0883,
0.2262,
0.3353,
0.2883
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.1257,
0.4257,
0.3114,
0.2419
],
"class_label": "building"
},
{
"id": 1,
"bbox": [
0.4392,
0.5532,
0.2361,
0.1388
],
"class_label": "car"
},
{
"id": 2,
"bbox": [
0.6866,
0.2854,
0.2109,
0.1409
],
"class_label": "truck"
},
{
"id": 3,
"bbox": [
0.4317,
0.3189,
0.3353,
0.2953
],
"class_label": "building"
},
{
"id": 4,
"bbox": [
0.6194,
0.6385,
0.255,
0.3615
],
"class_label": "building"
},
{
"id": 5,
"bbox": [
0.2083,
0.0889,
0.0952,
0.0946
],
"class_label": "bicycle"
},
{
"id": 6,
"bbox": [
0.5437,
0.7863,
0.1666,
0.1211
],
"class_label": "car"
},
{
"id": 7,
"bbox": [
0.1784,
0.7972,
0.0375,
0.0809
],
"class_label": "traffic_light"
},
{
"id": 8,
"bbox": [
0.1301,
0.4007,
0.2577,
0.1387
],
"class_label": "truck"
},
{
"id": 9,
"bbox": [
0.0883,
0.2262,
0.3353,
0.2883
],
"class_label": "building"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2011
},
{
"scene_id": "fix_classes_sample_012",
"scene_type": "urban_street",
"scene_description": "A busy urban street scene with vehicles, pedestrians, and city infrastructure. The scene contains 8 objects: a building at middle-left (bbox: x=0.16, y=0.44, w=0.22, h=0.20); a traffic_light at middle-right (bbox: x=0.77, y=0.38, w=0.03, h=0.07); a bench at center (bbox: x=0.45, y=0.58, w=0.14, h=0.06); a traffic_light at bottom-right (bbox: x=0.81, y=0.84, w=0.03, h=0.07); a tree at top-left (bbox: x=0.13, y=0.08, w=0.08, h=0.18); a tree at bottom-center (bbox: x=0.47, y=0.73, w=0.09, h=0.27); a tree at bottom-right (bbox: x=0.82, y=0.71, w=0.12, h=0.29); a tree at middle-right (bbox: x=0.83, y=0.51, w=0.13, h=0.24).",
"objects": [
{
"id": 0,
"class_label": "building",
"position": "middle-left",
"bbox": [
0.1595,
0.436,
0.2157,
0.2025
]
},
{
"id": 1,
"class_label": "traffic_light",
"position": "middle-right",
"bbox": [
0.7682,
0.3769,
0.0295,
0.071
]
},
{
"id": 2,
"class_label": "bench",
"position": "center",
"bbox": [
0.4516,
0.5774,
0.1402,
0.0622
]
},
{
"id": 3,
"class_label": "traffic_light",
"position": "bottom-right",
"bbox": [
0.8113,
0.8356,
0.0273,
0.0717
]
},
{
"id": 4,
"class_label": "tree",
"position": "top-left",
"bbox": [
0.1348,
0.0786,
0.0823,
0.1845
]
},
{
"id": 5,
"class_label": "tree",
"position": "bottom-center",
"bbox": [
0.4715,
0.733,
0.0878,
0.267
]
},
{
"id": 6,
"class_label": "tree",
"position": "bottom-right",
"bbox": [
0.8165,
0.7099,
0.1157,
0.2901
]
},
{
"id": 7,
"class_label": "tree",
"position": "middle-right",
"bbox": [
0.8317,
0.5051,
0.1325,
0.2409
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.1595,
0.436,
0.2157,
0.2025
],
"class_label": "building"
},
{
"id": 1,
"bbox": [
0.7682,
0.3769,
0.0295,
0.071
],
"class_label": "traffic_light"
},
{
"id": 2,
"bbox": [
0.4516,
0.5774,
0.1402,
0.0622
],
"class_label": "bench"
},
{
"id": 3,
"bbox": [
0.8113,
0.8356,
0.0273,
0.0717
],
"class_label": "traffic_light"
},
{
"id": 4,
"bbox": [
0.1348,
0.0786,
0.0823,
0.1845
],
"class_label": "tree"
},
{
"id": 5,
"bbox": [
0.4715,
0.733,
0.0878,
0.267
],
"class_label": "tree"
},
{
"id": 6,
"bbox": [
0.8165,
0.7099,
0.1157,
0.2901
],
"class_label": "tree"
},
{
"id": 7,
"bbox": [
0.8317,
0.5051,
0.1325,
0.2409
],
"class_label": "tree"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2012
},
{
"scene_id": "fix_classes_sample_013",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 4 objects: a bench at bottom-left (bbox: x=0.20, y=0.78, w=0.14, h=0.06); a car at bottom-left (bbox: x=0.18, y=0.69, w=0.22, h=0.13); a cat at top-left (bbox: x=0.23, y=0.12, w=0.04, h=0.05); a car at bottom-right (bbox: x=0.70, y=0.72, w=0.12, h=0.14).",
"objects": [
{
"id": 0,
"class_label": "bench",
"position": "bottom-left",
"bbox": [
0.1999,
0.7841,
0.1363,
0.0602
]
},
{
"id": 1,
"class_label": "car",
"position": "bottom-left",
"bbox": [
0.182,
0.6876,
0.2152,
0.1323
]
},
{
"id": 2,
"class_label": "cat",
"position": "top-left",
"bbox": [
0.2317,
0.124,
0.0444,
0.0495
]
},
{
"id": 3,
"class_label": "car",
"position": "bottom-right",
"bbox": [
0.7013,
0.717,
0.1208,
0.1421
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.1999,
0.7841,
0.1363,
0.0602
],
"class_label": "bench"
},
{
"id": 1,
"bbox": [
0.182,
0.6876,
0.2152,
0.1323
],
"class_label": "car"
},
{
"id": 2,
"bbox": [
0.2317,
0.124,
0.0444,
0.0495
],
"class_label": "cat"
},
{
"id": 3,
"bbox": [
0.7013,
0.717,
0.1208,
0.1421
],
"class_label": "car"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2013
},
{
"scene_id": "fix_classes_sample_014",
"scene_type": "parking_lot",
"scene_description": "A parking lot with various vehicles and some pedestrians. The scene contains 11 objects: a truck at middle-right (bbox: x=0.69, y=0.29, w=0.29, h=0.13); a bicycle at middle-right (bbox: x=0.86, y=0.43, w=0.07, h=0.10); a bicycle at middle-left (bbox: x=0.11, y=0.39, w=0.08, h=0.07); a person at bottom-left (bbox: x=0.14, y=0.66, w=0.06, h=0.16); a person at top-left (bbox: x=0.13, y=0.19, w=0.06, h=0.16); a car at bottom-right (bbox: x=0.81, y=0.78, w=0.10, h=0.09); a person at middle-right (bbox: x=0.69, y=0.32, w=0.06, h=0.19); a truck at top-center (bbox: x=0.31, y=0.15, w=0.15, h=0.12); a car at top-left (bbox: x=0.02, y=0.23, w=0.22, h=0.09); a car at bottom-left (bbox: x=0.08, y=0.71, w=0.21, h=0.13); a bicycle at bottom-center (bbox: x=0.46, y=0.73, w=0.07, h=0.08).",
"objects": [
{
"id": 0,
"class_label": "truck",
"position": "middle-right",
"bbox": [
0.6928,
0.2898,
0.291,
0.1342
]
},
{
"id": 1,
"class_label": "bicycle",
"position": "middle-right",
"bbox": [
0.8609,
0.4331,
0.0675,
0.1006
]
},
{
"id": 2,
"class_label": "bicycle",
"position": "middle-left",
"bbox": [
0.1109,
0.3853,
0.0755,
0.0655
]
},
{
"id": 3,
"class_label": "person",
"position": "bottom-left",
"bbox": [
0.1435,
0.655,
0.0563,
0.1599
]
},
{
"id": 4,
"class_label": "person",
"position": "top-left",
"bbox": [
0.1256,
0.1887,
0.0592,
0.1575
]
},
{
"id": 5,
"class_label": "car",
"position": "bottom-right",
"bbox": [
0.8144,
0.7808,
0.1028,
0.0945
]
},
{
"id": 6,
"class_label": "person",
"position": "middle-right",
"bbox": [
0.691,
0.3242,
0.0615,
0.1868
]
},
{
"id": 7,
"class_label": "truck",
"position": "top-center",
"bbox": [
0.3052,
0.1515,
0.1526,
0.1199
]
},
{
"id": 8,
"class_label": "car",
"position": "top-left",
"bbox": [
0.0238,
0.2273,
0.2191,
0.0936
]
},
{
"id": 9,
"class_label": "car",
"position": "bottom-left",
"bbox": [
0.0832,
0.7148,
0.2069,
0.1275
]
},
{
"id": 10,
"class_label": "bicycle",
"position": "bottom-center",
"bbox": [
0.4554,
0.7334,
0.0684,
0.0751
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.6928,
0.2898,
0.291,
0.1342
],
"class_label": "truck"
},
{
"id": 1,
"bbox": [
0.8609,
0.4331,
0.0675,
0.1006
],
"class_label": "bicycle"
},
{
"id": 2,
"bbox": [
0.1109,
0.3853,
0.0755,
0.0655
],
"class_label": "bicycle"
},
{
"id": 3,
"bbox": [
0.1435,
0.655,
0.0563,
0.1599
],
"class_label": "person"
},
{
"id": 4,
"bbox": [
0.1256,
0.1887,
0.0592,
0.1575
],
"class_label": "person"
},
{
"id": 5,
"bbox": [
0.8144,
0.7808,
0.1028,
0.0945
],
"class_label": "car"
},
{
"id": 6,
"bbox": [
0.691,
0.3242,
0.0615,
0.1868
],
"class_label": "person"
},
{
"id": 7,
"bbox": [
0.3052,
0.1515,
0.1526,
0.1199
],
"class_label": "truck"
},
{
"id": 8,
"bbox": [
0.0238,
0.2273,
0.2191,
0.0936
],
"class_label": "car"
},
{
"id": 9,
"bbox": [
0.0832,
0.7148,
0.2069,
0.1275
],
"class_label": "car"
},
{
"id": 10,
"bbox": [
0.4554,
0.7334,
0.0684,
0.0751
],
"class_label": "bicycle"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2014
},
{
"scene_id": "fix_classes_sample_015",
"scene_type": "urban_street",
"scene_description": "A busy urban street scene with vehicles, pedestrians, and city infrastructure. The scene contains 10 objects: a car at top-right (bbox: x=0.75, y=0.14, w=0.21, h=0.13); a person at bottom-left (bbox: x=0.19, y=0.67, w=0.07, h=0.10); a traffic_light at top-left (bbox: x=0.21, y=0.16, w=0.03, h=0.10); a bench at bottom-left (bbox: x=0.11, y=0.67, w=0.09, h=0.07); a person at top-center (bbox: x=0.46, y=0.06, w=0.06, h=0.12); a truck at top-right (bbox: x=0.71, y=0.16, w=0.25, h=0.13); a tree at bottom-center (bbox: x=0.47, y=0.65, w=0.15, h=0.35); a car at top-right (bbox: x=0.77, y=0.07, w=0.17, h=0.12); a traffic_light at center (bbox: x=0.60, y=0.56, w=0.04, h=0.07); a tree at bottom-right (bbox: x=0.86, y=0.60, w=0.08, h=0.29).",
"objects": [
{
"id": 0,
"class_label": "car",
"position": "top-right",
"bbox": [
0.7536,
0.1368,
0.2118,
0.1311
]
},
{
"id": 1,
"class_label": "person",
"position": "bottom-left",
"bbox": [
0.1931,
0.6707,
0.0699,
0.1047
]
},
{
"id": 2,
"class_label": "traffic_light",
"position": "top-left",
"bbox": [
0.2108,
0.1594,
0.032,
0.0961
]
},
{
"id": 3,
"class_label": "bench",
"position": "bottom-left",
"bbox": [
0.1129,
0.6698,
0.0884,
0.0664
]
},
{
"id": 4,
"class_label": "person",
"position": "top-center",
"bbox": [
0.4649,
0.0567,
0.0568,
0.1179
]
},
{
"id": 5,
"class_label": "truck",
"position": "top-right",
"bbox": [
0.7132,
0.1596,
0.2483,
0.1285
]
},
{
"id": 6,
"class_label": "tree",
"position": "bottom-center",
"bbox": [
0.4742,
0.6523,
0.1469,
0.3477
]
},
{
"id": 7,
"class_label": "car",
"position": "top-right",
"bbox": [
0.7703,
0.0656,
0.172,
0.1152
]
},
{
"id": 8,
"class_label": "traffic_light",
"position": "center",
"bbox": [
0.6037,
0.5574,
0.0351,
0.0652
]
},
{
"id": 9,
"class_label": "tree",
"position": "bottom-right",
"bbox": [
0.8551,
0.6026,
0.0804,
0.2926
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.7536,
0.1368,
0.2118,
0.1311
],
"class_label": "car"
},
{
"id": 1,
"bbox": [
0.1931,
0.6707,
0.0699,
0.1047
],
"class_label": "person"
},
{
"id": 2,
"bbox": [
0.2108,
0.1594,
0.032,
0.0961
],
"class_label": "traffic_light"
},
{
"id": 3,
"bbox": [
0.1129,
0.6698,
0.0884,
0.0664
],
"class_label": "bench"
},
{
"id": 4,
"bbox": [
0.4649,
0.0567,
0.0568,
0.1179
],
"class_label": "person"
},
{
"id": 5,
"bbox": [
0.7132,
0.1596,
0.2483,
0.1285
],
"class_label": "truck"
},
{
"id": 6,
"bbox": [
0.4742,
0.6523,
0.1469,
0.3477
],
"class_label": "tree"
},
{
"id": 7,
"bbox": [
0.7703,
0.0656,
0.172,
0.1152
],
"class_label": "car"
},
{
"id": 8,
"bbox": [
0.6037,
0.5574,
0.0351,
0.0652
],
"class_label": "traffic_light"
},
{
"id": 9,
"bbox": [
0.8551,
0.6026,
0.0804,
0.2926
],
"class_label": "tree"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2015
},
{
"scene_id": "fix_classes_sample_016",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 8 objects: a bench at center (bbox: x=0.49, y=0.56, w=0.14, h=0.08); a tree at top-center (bbox: x=0.30, y=0.00, w=0.15, h=0.33); a person at middle-left (bbox: x=0.17, y=0.56, w=0.05, h=0.14); a person at top-center (bbox: x=0.40, y=0.20, w=0.07, h=0.18); a bench at top-left (bbox: x=0.13, y=0.07, w=0.10, h=0.08); a car at top-center (bbox: x=0.33, y=0.16, w=0.15, h=0.11); a car at middle-left (bbox: x=0.12, y=0.40, w=0.23, h=0.10); a car at bottom-right (bbox: x=0.79, y=0.78, w=0.11, h=0.11).",
"objects": [
{
"id": 0,
"class_label": "bench",
"position": "center",
"bbox": [
0.4902,
0.5556,
0.142,
0.0787
]
},
{
"id": 1,
"class_label": "tree",
"position": "top-center",
"bbox": [
0.3043,
0.0,
0.1483,
0.333
]
},
{
"id": 2,
"class_label": "person",
"position": "middle-left",
"bbox": [
0.1722,
0.5594,
0.054,
0.1359
]
},
{
"id": 3,
"class_label": "person",
"position": "top-center",
"bbox": [
0.3956,
0.2031,
0.0692,
0.1843
]
},
{
"id": 4,
"class_label": "bench",
"position": "top-left",
"bbox": [
0.1348,
0.065,
0.1009,
0.0764
]
},
{
"id": 5,
"class_label": "car",
"position": "top-center",
"bbox": [
0.3291,
0.161,
0.1452,
0.1115
]
},
{
"id": 6,
"class_label": "car",
"position": "middle-left",
"bbox": [
0.1194,
0.4049,
0.2295,
0.1046
]
},
{
"id": 7,
"class_label": "car",
"position": "bottom-right",
"bbox": [
0.7871,
0.7794,
0.1093,
0.1142
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.4902,
0.5556,
0.142,
0.0787
],
"class_label": "bench"
},
{
"id": 1,
"bbox": [
0.3043,
0.0,
0.1483,
0.333
],
"class_label": "tree"
},
{
"id": 2,
"bbox": [
0.1722,
0.5594,
0.054,
0.1359
],
"class_label": "person"
},
{
"id": 3,
"bbox": [
0.3956,
0.2031,
0.0692,
0.1843
],
"class_label": "person"
},
{
"id": 4,
"bbox": [
0.1348,
0.065,
0.1009,
0.0764
],
"class_label": "bench"
},
{
"id": 5,
"bbox": [
0.3291,
0.161,
0.1452,
0.1115
],
"class_label": "car"
},
{
"id": 6,
"bbox": [
0.1194,
0.4049,
0.2295,
0.1046
],
"class_label": "car"
},
{
"id": 7,
"bbox": [
0.7871,
0.7794,
0.1093,
0.1142
],
"class_label": "car"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2016
},
{
"scene_id": "fix_classes_sample_017",
"scene_type": "park",
"scene_description": "A peaceful park setting with trees, benches, and people walking their pets. The scene contains 7 objects: a cat at middle-right (bbox: x=0.67, y=0.48, w=0.08, h=0.05); a bench at top-center (bbox: x=0.52, y=0.17, w=0.10, h=0.07); a dog at top-left (bbox: x=0.10, y=0.22, w=0.09, h=0.07); a dog at top-right (bbox: x=0.77, y=0.27, w=0.06, h=0.05); a bicycle at bottom-right (bbox: x=0.78, y=0.81, w=0.08, h=0.11); a cat at middle-left (bbox: x=0.21, y=0.47, w=0.07, h=0.07); a bench at middle-right (bbox: x=0.66, y=0.51, w=0.13, h=0.05).",
"objects": [
{
"id": 0,
"class_label": "cat",
"position": "middle-right",
"bbox": [
0.6734,
0.4807,
0.0799,
0.0463
]
},
{
"id": 1,
"class_label": "bench",
"position": "top-center",
"bbox": [
0.519,
0.1714,
0.0967,
0.068
]
},
{
"id": 2,
"class_label": "dog",
"position": "top-left",
"bbox": [
0.1046,
0.2152,
0.0886,
0.0742
]
},
{
"id": 3,
"class_label": "dog",
"position": "top-right",
"bbox": [
0.7723,
0.2724,
0.0638,
0.0494
]
},
{
"id": 4,
"class_label": "bicycle",
"position": "bottom-right",
"bbox": [
0.7763,
0.8125,
0.0834,
0.1114
]
},
{
"id": 5,
"class_label": "cat",
"position": "middle-left",
"bbox": [
0.2058,
0.4687,
0.0715,
0.0665
]
},
{
"id": 6,
"class_label": "bench",
"position": "middle-right",
"bbox": [
0.6631,
0.5102,
0.1292,
0.0519
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.6734,
0.4807,
0.0799,
0.0463
],
"class_label": "cat"
},
{
"id": 1,
"bbox": [
0.519,
0.1714,
0.0967,
0.068
],
"class_label": "bench"
},
{
"id": 2,
"bbox": [
0.1046,
0.2152,
0.0886,
0.0742
],
"class_label": "dog"
},
{
"id": 3,
"bbox": [
0.7723,
0.2724,
0.0638,
0.0494
],
"class_label": "dog"
},
{
"id": 4,
"bbox": [
0.7763,
0.8125,
0.0834,
0.1114
],
"class_label": "bicycle"
},
{
"id": 5,
"bbox": [
0.2058,
0.4687,
0.0715,
0.0665
],
"class_label": "cat"
},
{
"id": 6,
"bbox": [
0.6631,
0.5102,
0.1292,
0.0519
],
"class_label": "bench"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2017
},
{
"scene_id": "fix_classes_sample_018",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 7 objects: a car at bottom-left (bbox: x=0.03, y=0.75, w=0.19, h=0.12); a truck at middle-left (bbox: x=0.11, y=0.42, w=0.16, h=0.17); a traffic_light at top-left (bbox: x=0.13, y=0.15, w=0.02, h=0.07); a bicycle at middle-right (bbox: x=0.72, y=0.40, w=0.10, h=0.07); a car at bottom-left (bbox: x=0.10, y=0.77, w=0.12, h=0.10); a building at bottom-center (bbox: x=0.43, y=0.76, w=0.22, h=0.22); a car at top-right (bbox: x=0.81, y=0.04, w=0.18, h=0.13).",
"objects": [
{
"id": 0,
"class_label": "car",
"position": "bottom-left",
"bbox": [
0.027,
0.7491,
0.1941,
0.1155
]
},
{
"id": 1,
"class_label": "truck",
"position": "middle-left",
"bbox": [
0.1092,
0.4239,
0.1552,
0.169
]
},
{
"id": 2,
"class_label": "traffic_light",
"position": "top-left",
"bbox": [
0.1296,
0.1527,
0.0216,
0.0666
]
},
{
"id": 3,
"class_label": "bicycle",
"position": "middle-right",
"bbox": [
0.7168,
0.4022,
0.0966,
0.0716
]
},
{
"id": 4,
"class_label": "car",
"position": "bottom-left",
"bbox": [
0.1018,
0.7741,
0.124,
0.0958
]
},
{
"id": 5,
"class_label": "building",
"position": "bottom-center",
"bbox": [
0.4343,
0.7612,
0.2181,
0.2168
]
},
{
"id": 6,
"class_label": "car",
"position": "top-right",
"bbox": [
0.8111,
0.0398,
0.1766,
0.1255
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.027,
0.7491,
0.1941,
0.1155
],
"class_label": "car"
},
{
"id": 1,
"bbox": [
0.1092,
0.4239,
0.1552,
0.169
],
"class_label": "truck"
},
{
"id": 2,
"bbox": [
0.1296,
0.1527,
0.0216,
0.0666
],
"class_label": "traffic_light"
},
{
"id": 3,
"bbox": [
0.7168,
0.4022,
0.0966,
0.0716
],
"class_label": "bicycle"
},
{
"id": 4,
"bbox": [
0.1018,
0.7741,
0.124,
0.0958
],
"class_label": "car"
},
{
"id": 5,
"bbox": [
0.4343,
0.7612,
0.2181,
0.2168
],
"class_label": "building"
},
{
"id": 6,
"bbox": [
0.8111,
0.0398,
0.1766,
0.1255
],
"class_label": "car"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2018
},
{
"scene_id": "fix_classes_sample_019",
"scene_type": "park",
"scene_description": "A peaceful park setting with trees, benches, and people walking their pets. The scene contains 5 objects: a tree at top-right (bbox: x=0.78, y=0.06, w=0.10, h=0.20); a bicycle at center (bbox: x=0.53, y=0.45, w=0.08, h=0.07); a bicycle at middle-right (bbox: x=0.72, y=0.57, w=0.10, h=0.08); a bicycle at bottom-center (bbox: x=0.35, y=0.76, w=0.09, h=0.07); a person at top-right (bbox: x=0.79, y=0.06, w=0.08, h=0.11).",
"objects": [
{
"id": 0,
"class_label": "tree",
"position": "top-right",
"bbox": [
0.7803,
0.0635,
0.0972,
0.1999
]
},
{
"id": 1,
"class_label": "bicycle",
"position": "center",
"bbox": [
0.529,
0.4504,
0.0848,
0.0744
]
},
{
"id": 2,
"class_label": "bicycle",
"position": "middle-right",
"bbox": [
0.718,
0.5661,
0.0993,
0.0823
]
},
{
"id": 3,
"class_label": "bicycle",
"position": "bottom-center",
"bbox": [
0.3502,
0.7551,
0.0938,
0.0665
]
},
{
"id": 4,
"class_label": "person",
"position": "top-right",
"bbox": [
0.7931,
0.0593,
0.0786,
0.1065
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.7803,
0.0635,
0.0972,
0.1999
],
"class_label": "tree"
},
{
"id": 1,
"bbox": [
0.529,
0.4504,
0.0848,
0.0744
],
"class_label": "bicycle"
},
{
"id": 2,
"bbox": [
0.718,
0.5661,
0.0993,
0.0823
],
"class_label": "bicycle"
},
{
"id": 3,
"bbox": [
0.3502,
0.7551,
0.0938,
0.0665
],
"class_label": "bicycle"
},
{
"id": 4,
"bbox": [
0.7931,
0.0593,
0.0786,
0.1065
],
"class_label": "person"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2019
},
{
"scene_id": "fix_classes_sample_020",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 10 objects: a truck at bottom-center (bbox: x=0.48, y=0.74, w=0.29, h=0.14); a bicycle at top-center (bbox: x=0.37, y=0.20, w=0.09, h=0.07); a bicycle at top-right (bbox: x=0.79, y=0.17, w=0.09, h=0.07); a bicycle at bottom-right (bbox: x=0.74, y=0.81, w=0.10, h=0.11); a person at middle-left (bbox: x=0.26, y=0.56, w=0.04, h=0.18); a bicycle at center (bbox: x=0.49, y=0.41, w=0.11, h=0.07); a truck at center (bbox: x=0.31, y=0.29, w=0.23, h=0.15); a bicycle at middle-left (bbox: x=0.22, y=0.58, w=0.10, h=0.09); a truck at bottom-left (bbox: x=0.16, y=0.65, w=0.21, h=0.16); a traffic_light at middle-right (bbox: x=0.73, y=0.39, w=0.03, h=0.06).",
"objects": [
{
"id": 0,
"class_label": "truck",
"position": "bottom-center",
"bbox": [
0.4842,
0.7396,
0.2919,
0.1379
]
},
{
"id": 1,
"class_label": "bicycle",
"position": "top-center",
"bbox": [
0.3691,
0.1968,
0.0875,
0.0744
]
},
{
"id": 2,
"class_label": "bicycle",
"position": "top-right",
"bbox": [
0.7899,
0.1651,
0.0883,
0.0663
]
},
{
"id": 3,
"class_label": "bicycle",
"position": "bottom-right",
"bbox": [
0.7361,
0.8088,
0.1048,
0.1081
]
},
{
"id": 4,
"class_label": "person",
"position": "middle-left",
"bbox": [
0.255,
0.5592,
0.0449,
0.1798
]
},
{
"id": 5,
"class_label": "bicycle",
"position": "center",
"bbox": [
0.4906,
0.4054,
0.1051,
0.0693
]
},
{
"id": 6,
"class_label": "truck",
"position": "center",
"bbox": [
0.3108,
0.2872,
0.2252,
0.1501
]
},
{
"id": 7,
"class_label": "bicycle",
"position": "middle-left",
"bbox": [
0.2234,
0.5763,
0.104,
0.0941
]
},
{
"id": 8,
"class_label": "truck",
"position": "bottom-left",
"bbox": [
0.1611,
0.6516,
0.208,
0.1616
]
},
{
"id": 9,
"class_label": "traffic_light",
"position": "middle-right",
"bbox": [
0.7307,
0.3901,
0.0326,
0.0636
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.4842,
0.7396,
0.2919,
0.1379
],
"class_label": "truck"
},
{
"id": 1,
"bbox": [
0.3691,
0.1968,
0.0875,
0.0744
],
"class_label": "bicycle"
},
{
"id": 2,
"bbox": [
0.7899,
0.1651,
0.0883,
0.0663
],
"class_label": "bicycle"
},
{
"id": 3,
"bbox": [
0.7361,
0.8088,
0.1048,
0.1081
],
"class_label": "bicycle"
},
{
"id": 4,
"bbox": [
0.255,
0.5592,
0.0449,
0.1798
],
"class_label": "person"
},
{
"id": 5,
"bbox": [
0.4906,
0.4054,
0.1051,
0.0693
],
"class_label": "bicycle"
},
{
"id": 6,
"bbox": [
0.3108,
0.2872,
0.2252,
0.1501
],
"class_label": "truck"
},
{
"id": 7,
"bbox": [
0.2234,
0.5763,
0.104,
0.0941
],
"class_label": "bicycle"
},
{
"id": 8,
"bbox": [
0.1611,
0.6516,
0.208,
0.1616
],
"class_label": "truck"
},
{
"id": 9,
"bbox": [
0.7307,
0.3901,
0.0326,
0.0636
],
"class_label": "traffic_light"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2020
},
{
"scene_id": "fix_classes_sample_021",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 9 objects: a dog at center (bbox: x=0.61, y=0.46, w=0.06, h=0.07); a building at middle-right (bbox: x=0.78, y=0.24, w=0.20, h=0.32); a bench at top-left (bbox: x=0.14, y=0.08, w=0.13, h=0.07); a bench at bottom-center (bbox: x=0.50, y=0.79, w=0.09, h=0.07); a bench at center (bbox: x=0.53, y=0.52, w=0.12, h=0.07); a tree at middle-left (bbox: x=0.05, y=0.39, w=0.15, h=0.24); a car at bottom-center (bbox: x=0.28, y=0.76, w=0.14, h=0.09); a tree at middle-left (bbox: x=0.08, y=0.32, w=0.13, h=0.32); a cat at middle-right (bbox: x=0.72, y=0.35, w=0.07, h=0.05).",
"objects": [
{
"id": 0,
"class_label": "dog",
"position": "center",
"bbox": [
0.6109,
0.4594,
0.0624,
0.0654
]
},
{
"id": 1,
"class_label": "building",
"position": "middle-right",
"bbox": [
0.7807,
0.239,
0.204,
0.3188
]
},
{
"id": 2,
"class_label": "bench",
"position": "top-left",
"bbox": [
0.1436,
0.0751,
0.132,
0.0702
]
},
{
"id": 3,
"class_label": "bench",
"position": "bottom-center",
"bbox": [
0.4966,
0.7936,
0.088,
0.0681
]
},
{
"id": 4,
"class_label": "bench",
"position": "center",
"bbox": [
0.5316,
0.5232,
0.1169,
0.0701
]
},
{
"id": 5,
"class_label": "tree",
"position": "middle-left",
"bbox": [
0.0487,
0.3934,
0.1488,
0.2385
]
},
{
"id": 6,
"class_label": "car",
"position": "bottom-center",
"bbox": [
0.2803,
0.7625,
0.1424,
0.0896
]
},
{
"id": 7,
"class_label": "tree",
"position": "middle-left",
"bbox": [
0.083,
0.32,
0.1329,
0.3161
]
},
{
"id": 8,
"class_label": "cat",
"position": "middle-right",
"bbox": [
0.721,
0.3518,
0.0677,
0.0478
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.6109,
0.4594,
0.0624,
0.0654
],
"class_label": "dog"
},
{
"id": 1,
"bbox": [
0.7807,
0.239,
0.204,
0.3188
],
"class_label": "building"
},
{
"id": 2,
"bbox": [
0.1436,
0.0751,
0.132,
0.0702
],
"class_label": "bench"
},
{
"id": 3,
"bbox": [
0.4966,
0.7936,
0.088,
0.0681
],
"class_label": "bench"
},
{
"id": 4,
"bbox": [
0.5316,
0.5232,
0.1169,
0.0701
],
"class_label": "bench"
},
{
"id": 5,
"bbox": [
0.0487,
0.3934,
0.1488,
0.2385
],
"class_label": "tree"
},
{
"id": 6,
"bbox": [
0.2803,
0.7625,
0.1424,
0.0896
],
"class_label": "car"
},
{
"id": 7,
"bbox": [
0.083,
0.32,
0.1329,
0.3161
],
"class_label": "tree"
},
{
"id": 8,
"bbox": [
0.721,
0.3518,
0.0677,
0.0478
],
"class_label": "cat"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2021
},
{
"scene_id": "fix_classes_sample_022",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 8 objects: a traffic_light at bottom-right (bbox: x=0.84, y=0.87, w=0.03, h=0.06); a traffic_light at middle-right (bbox: x=0.83, y=0.40, w=0.04, h=0.09); a building at bottom-center (bbox: x=0.23, y=0.67, w=0.26, h=0.33); a person at top-left (bbox: x=0.14, y=0.07, w=0.08, h=0.23); a car at bottom-left (bbox: x=0.04, y=0.79, w=0.14, h=0.09); a traffic_light at top-center (bbox: x=0.50, y=0.18, w=0.03, h=0.09); a traffic_light at center (bbox: x=0.49, y=0.40, w=0.04, h=0.09); a person at top-left (bbox: x=0.22, y=0.13, w=0.06, h=0.10).",
"objects": [
{
"id": 0,
"class_label": "traffic_light",
"position": "bottom-right",
"bbox": [
0.8436,
0.8652,
0.0262,
0.0624
]
},
{
"id": 1,
"class_label": "traffic_light",
"position": "middle-right",
"bbox": [
0.8341,
0.3954,
0.0362,
0.0944
]
},
{
"id": 2,
"class_label": "building",
"position": "bottom-center",
"bbox": [
0.2314,
0.6701,
0.2599,
0.3299
]
},
{
"id": 3,
"class_label": "person",
"position": "top-left",
"bbox": [
0.1355,
0.0654,
0.0762,
0.2314
]
},
{
"id": 4,
"class_label": "car",
"position": "bottom-left",
"bbox": [
0.0404,
0.7887,
0.1398,
0.0917
]
},
{
"id": 5,
"class_label": "traffic_light",
"position": "top-center",
"bbox": [
0.5017,
0.1826,
0.0336,
0.087
]
},
{
"id": 6,
"class_label": "traffic_light",
"position": "center",
"bbox": [
0.4924,
0.3996,
0.0385,
0.0941
]
},
{
"id": 7,
"class_label": "person",
"position": "top-left",
"bbox": [
0.2201,
0.1322,
0.0573,
0.1042
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.8436,
0.8652,
0.0262,
0.0624
],
"class_label": "traffic_light"
},
{
"id": 1,
"bbox": [
0.8341,
0.3954,
0.0362,
0.0944
],
"class_label": "traffic_light"
},
{
"id": 2,
"bbox": [
0.2314,
0.6701,
0.2599,
0.3299
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.1355,
0.0654,
0.0762,
0.2314
],
"class_label": "person"
},
{
"id": 4,
"bbox": [
0.0404,
0.7887,
0.1398,
0.0917
],
"class_label": "car"
},
{
"id": 5,
"bbox": [
0.5017,
0.1826,
0.0336,
0.087
],
"class_label": "traffic_light"
},
{
"id": 6,
"bbox": [
0.4924,
0.3996,
0.0385,
0.0941
],
"class_label": "traffic_light"
},
{
"id": 7,
"bbox": [
0.2201,
0.1322,
0.0573,
0.1042
],
"class_label": "person"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2022
},
{
"scene_id": "fix_classes_sample_023",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 9 objects: a car at bottom-left (bbox: x=0.09, y=0.66, w=0.15, h=0.12); a building at center (bbox: x=0.35, y=0.24, w=0.32, h=0.33); a tree at top-left (bbox: x=0.08, y=0.19, w=0.09, h=0.16); a building at middle-left (bbox: x=0.10, y=0.29, w=0.18, h=0.32); a building at top-center (bbox: x=0.23, y=0.00, w=0.26, h=0.32); a tree at top-center (bbox: x=0.58, y=0.11, w=0.12, h=0.16); a tree at top-right (bbox: x=0.82, y=0.10, w=0.12, h=0.33); a cat at top-center (bbox: x=0.46, y=0.26, w=0.06, h=0.04); a building at bottom-right (bbox: x=0.65, y=0.55, w=0.33, h=0.42).",
"objects": [
{
"id": 0,
"class_label": "car",
"position": "bottom-left",
"bbox": [
0.0934,
0.66,
0.148,
0.12
]
},
{
"id": 1,
"class_label": "building",
"position": "center",
"bbox": [
0.3494,
0.2369,
0.3177,
0.3329
]
},
{
"id": 2,
"class_label": "tree",
"position": "top-left",
"bbox": [
0.0778,
0.1878,
0.0948,
0.164
]
},
{
"id": 3,
"class_label": "building",
"position": "middle-left",
"bbox": [
0.0989,
0.2924,
0.1809,
0.32
]
},
{
"id": 4,
"class_label": "building",
"position": "top-center",
"bbox": [
0.2304,
0.0,
0.2576,
0.3153
]
},
{
"id": 5,
"class_label": "tree",
"position": "top-center",
"bbox": [
0.585,
0.1141,
0.1207,
0.1638
]
},
{
"id": 6,
"class_label": "tree",
"position": "top-right",
"bbox": [
0.8158,
0.0991,
0.1173,
0.3288
]
},
{
"id": 7,
"class_label": "cat",
"position": "top-center",
"bbox": [
0.4609,
0.2612,
0.063,
0.0417
]
},
{
"id": 8,
"class_label": "building",
"position": "bottom-right",
"bbox": [
0.6509,
0.5535,
0.3284,
0.4187
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.0934,
0.66,
0.148,
0.12
],
"class_label": "car"
},
{
"id": 1,
"bbox": [
0.3494,
0.2369,
0.3177,
0.3329
],
"class_label": "building"
},
{
"id": 2,
"bbox": [
0.0778,
0.1878,
0.0948,
0.164
],
"class_label": "tree"
},
{
"id": 3,
"bbox": [
0.0989,
0.2924,
0.1809,
0.32
],
"class_label": "building"
},
{
"id": 4,
"bbox": [
0.2304,
0.0,
0.2576,
0.3153
],
"class_label": "building"
},
{
"id": 5,
"bbox": [
0.585,
0.1141,
0.1207,
0.1638
],
"class_label": "tree"
},
{
"id": 6,
"bbox": [
0.8158,
0.0991,
0.1173,
0.3288
],
"class_label": "tree"
},
{
"id": 7,
"bbox": [
0.4609,
0.2612,
0.063,
0.0417
],
"class_label": "cat"
},
{
"id": 8,
"bbox": [
0.6509,
0.5535,
0.3284,
0.4187
],
"class_label": "building"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2023
},
{
"scene_id": "fix_classes_sample_024",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 5 objects: a cat at center (bbox: x=0.55, y=0.55, w=0.05, h=0.06); a dog at middle-left (bbox: x=0.13, y=0.47, w=0.08, h=0.07); a dog at middle-left (bbox: x=0.17, y=0.54, w=0.07, h=0.07); a bench at middle-left (bbox: x=0.22, y=0.56, w=0.13, h=0.07); a cat at top-right (bbox: x=0.87, y=0.22, w=0.06, h=0.07).",
"objects": [
{
"id": 0,
"class_label": "cat",
"position": "center",
"bbox": [
0.5532,
0.5467,
0.048,
0.0617
]
},
{
"id": 1,
"class_label": "dog",
"position": "middle-left",
"bbox": [
0.1299,
0.4735,
0.0818,
0.0694
]
},
{
"id": 2,
"class_label": "dog",
"position": "middle-left",
"bbox": [
0.1711,
0.5353,
0.0655,
0.0682
]
},
{
"id": 3,
"class_label": "bench",
"position": "middle-left",
"bbox": [
0.2208,
0.5635,
0.1282,
0.0718
]
},
{
"id": 4,
"class_label": "cat",
"position": "top-right",
"bbox": [
0.8652,
0.2211,
0.0613,
0.066
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.5532,
0.5467,
0.048,
0.0617
],
"class_label": "cat"
},
{
"id": 1,
"bbox": [
0.1299,
0.4735,
0.0818,
0.0694
],
"class_label": "dog"
},
{
"id": 2,
"bbox": [
0.1711,
0.5353,
0.0655,
0.0682
],
"class_label": "dog"
},
{
"id": 3,
"bbox": [
0.2208,
0.5635,
0.1282,
0.0718
],
"class_label": "bench"
},
{
"id": 4,
"bbox": [
0.8652,
0.2211,
0.0613,
0.066
],
"class_label": "cat"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2024
},
{
"scene_id": "fix_classes_sample_025",
"scene_type": "intersection",
"scene_description": "A road intersection with traffic lights, vehicles, and crossing pedestrians. The scene contains 6 objects: a building at bottom-center (bbox: x=0.29, y=0.61, w=0.34, h=0.33); a truck at top-center (bbox: x=0.28, y=0.09, w=0.21, h=0.11); a traffic_light at top-center (bbox: x=0.50, y=0.07, w=0.03, h=0.08); a truck at middle-left (bbox: x=0.18, y=0.53, w=0.15, h=0.12); a traffic_light at bottom-center (bbox: x=0.52, y=0.76, w=0.03, h=0.10); a truck at top-center (bbox: x=0.49, y=0.16, w=0.19, h=0.10).",
"objects": [
{
"id": 0,
"class_label": "building",
"position": "bottom-center",
"bbox": [
0.2917,
0.609,
0.3394,
0.3323
]
},
{
"id": 1,
"class_label": "truck",
"position": "top-center",
"bbox": [
0.2819,
0.0884,
0.2074,
0.1078
]
},
{
"id": 2,
"class_label": "traffic_light",
"position": "top-center",
"bbox": [
0.502,
0.0711,
0.0282,
0.0845
]
},
{
"id": 3,
"class_label": "truck",
"position": "middle-left",
"bbox": [
0.1802,
0.5254,
0.154,
0.1182
]
},
{
"id": 4,
"class_label": "traffic_light",
"position": "bottom-center",
"bbox": [
0.5152,
0.761,
0.0271,
0.0965
]
},
{
"id": 5,
"class_label": "truck",
"position": "top-center",
"bbox": [
0.4921,
0.1592,
0.1865,
0.1026
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.2917,
0.609,
0.3394,
0.3323
],
"class_label": "building"
},
{
"id": 1,
"bbox": [
0.2819,
0.0884,
0.2074,
0.1078
],
"class_label": "truck"
},
{
"id": 2,
"bbox": [
0.502,
0.0711,
0.0282,
0.0845
],
"class_label": "traffic_light"
},
{
"id": 3,
"bbox": [
0.1802,
0.5254,
0.154,
0.1182
],
"class_label": "truck"
},
{
"id": 4,
"bbox": [
0.5152,
0.761,
0.0271,
0.0965
],
"class_label": "traffic_light"
},
{
"id": 5,
"bbox": [
0.4921,
0.1592,
0.1865,
0.1026
],
"class_label": "truck"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2025
},
{
"scene_id": "fix_classes_sample_026",
"scene_type": "urban_street",
"scene_description": "A busy urban street scene with vehicles, pedestrians, and city infrastructure. The scene contains 7 objects: a truck at middle-left (bbox: x=0.04, y=0.45, w=0.28, h=0.15); a bench at bottom-center (bbox: x=0.33, y=0.83, w=0.10, h=0.07); a bench at top-left (bbox: x=0.17, y=0.11, w=0.14, h=0.07); a traffic_light at middle-right (bbox: x=0.84, y=0.60, w=0.04, h=0.10); a truck at middle-right (bbox: x=0.68, y=0.32, w=0.16, h=0.14); a traffic_light at top-left (bbox: x=0.17, y=0.08, w=0.04, h=0.07); a bench at top-center (bbox: x=0.56, y=0.24, w=0.11, h=0.07).",
"objects": [
{
"id": 0,
"class_label": "truck",
"position": "middle-left",
"bbox": [
0.042,
0.4469,
0.2842,
0.1497
]
},
{
"id": 1,
"class_label": "bench",
"position": "bottom-center",
"bbox": [
0.3348,
0.8291,
0.0968,
0.0684
]
},
{
"id": 2,
"class_label": "bench",
"position": "top-left",
"bbox": [
0.1674,
0.1068,
0.137,
0.0706
]
},
{
"id": 3,
"class_label": "traffic_light",
"position": "middle-right",
"bbox": [
0.8412,
0.6013,
0.0396,
0.0972
]
},
{
"id": 4,
"class_label": "truck",
"position": "middle-right",
"bbox": [
0.6758,
0.3207,
0.1634,
0.143
]
},
{
"id": 5,
"class_label": "traffic_light",
"position": "top-left",
"bbox": [
0.1737,
0.0808,
0.037,
0.0748
]
},
{
"id": 6,
"class_label": "bench",
"position": "top-center",
"bbox": [
0.5551,
0.238,
0.1098,
0.0741
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.042,
0.4469,
0.2842,
0.1497
],
"class_label": "truck"
},
{
"id": 1,
"bbox": [
0.3348,
0.8291,
0.0968,
0.0684
],
"class_label": "bench"
},
{
"id": 2,
"bbox": [
0.1674,
0.1068,
0.137,
0.0706
],
"class_label": "bench"
},
{
"id": 3,
"bbox": [
0.8412,
0.6013,
0.0396,
0.0972
],
"class_label": "traffic_light"
},
{
"id": 4,
"bbox": [
0.6758,
0.3207,
0.1634,
0.143
],
"class_label": "truck"
},
{
"id": 5,
"bbox": [
0.1737,
0.0808,
0.037,
0.0748
],
"class_label": "traffic_light"
},
{
"id": 6,
"bbox": [
0.5551,
0.238,
0.1098,
0.0741
],
"class_label": "bench"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2026
},
{
"scene_id": "fix_classes_sample_027",
"scene_type": "urban_street",
"scene_description": "A busy urban street scene with vehicles, pedestrians, and city infrastructure. The scene contains 8 objects: a truck at top-left (bbox: x=0.10, y=0.18, w=0.25, h=0.16); a tree at top-right (bbox: x=0.71, y=0.13, w=0.10, h=0.19); a building at center (bbox: x=0.52, y=0.33, w=0.16, h=0.44); a traffic_light at bottom-left (bbox: x=0.26, y=0.84, w=0.03, h=0.07); a bicycle at bottom-left (bbox: x=0.21, y=0.74, w=0.09, h=0.07); a building at top-center (bbox: x=0.46, y=0.00, w=0.30, h=0.42); a bench at center (bbox: x=0.59, y=0.45, w=0.12, h=0.06); a truck at top-right (bbox: x=0.77, y=0.17, w=0.19, h=0.11).",
"objects": [
{
"id": 0,
"class_label": "truck",
"position": "top-left",
"bbox": [
0.101,
0.1795,
0.2483,
0.1634
]
},
{
"id": 1,
"class_label": "tree",
"position": "top-right",
"bbox": [
0.7056,
0.129,
0.1043,
0.1858
]
},
{
"id": 2,
"class_label": "building",
"position": "center",
"bbox": [
0.5164,
0.3275,
0.1634,
0.4374
]
},
{
"id": 3,
"class_label": "traffic_light",
"position": "bottom-left",
"bbox": [
0.2606,
0.8354,
0.0301,
0.0663
]
},
{
"id": 4,
"class_label": "bicycle",
"position": "bottom-left",
"bbox": [
0.2147,
0.7399,
0.0872,
0.0698
]
},
{
"id": 5,
"class_label": "building",
"position": "top-center",
"bbox": [
0.4562,
0.0,
0.3039,
0.4205
]
},
{
"id": 6,
"class_label": "bench",
"position": "center",
"bbox": [
0.5909,
0.4452,
0.1168,
0.0582
]
},
{
"id": 7,
"class_label": "truck",
"position": "top-right",
"bbox": [
0.7651,
0.1696,
0.1909,
0.1058
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.101,
0.1795,
0.2483,
0.1634
],
"class_label": "truck"
},
{
"id": 1,
"bbox": [
0.7056,
0.129,
0.1043,
0.1858
],
"class_label": "tree"
},
{
"id": 2,
"bbox": [
0.5164,
0.3275,
0.1634,
0.4374
],
"class_label": "building"
},
{
"id": 3,
"bbox": [
0.2606,
0.8354,
0.0301,
0.0663
],
"class_label": "traffic_light"
},
{
"id": 4,
"bbox": [
0.2147,
0.7399,
0.0872,
0.0698
],
"class_label": "bicycle"
},
{
"id": 5,
"bbox": [
0.4562,
0.0,
0.3039,
0.4205
],
"class_label": "building"
},
{
"id": 6,
"bbox": [
0.5909,
0.4452,
0.1168,
0.0582
],
"class_label": "bench"
},
{
"id": 7,
"bbox": [
0.7651,
0.1696,
0.1909,
0.1058
],
"class_label": "truck"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2027
},
{
"scene_id": "fix_classes_sample_028",
"scene_type": "parking_lot",
"scene_description": "A parking lot with various vehicles and some pedestrians. The scene contains 7 objects: a car at middle-right (bbox: x=0.75, y=0.33, w=0.15, h=0.15); a building at middle-right (bbox: x=0.68, y=0.45, w=0.26, h=0.34); a car at middle-left (bbox: x=0.17, y=0.39, w=0.10, h=0.10); a truck at bottom-left (bbox: x=0.08, y=0.82, w=0.29, h=0.15); a bicycle at top-right (bbox: x=0.79, y=0.13, w=0.08, h=0.08); a truck at bottom-right (bbox: x=0.79, y=0.84, w=0.18, h=0.12); a bicycle at bottom-right (bbox: x=0.80, y=0.76, w=0.09, h=0.07).",
"objects": [
{
"id": 0,
"class_label": "car",
"position": "middle-right",
"bbox": [
0.7541,
0.3326,
0.1543,
0.1474
]
},
{
"id": 1,
"class_label": "building",
"position": "middle-right",
"bbox": [
0.6763,
0.4525,
0.2553,
0.3423
]
},
{
"id": 2,
"class_label": "car",
"position": "middle-left",
"bbox": [
0.1654,
0.3879,
0.1021,
0.1011
]
},
{
"id": 3,
"class_label": "truck",
"position": "bottom-left",
"bbox": [
0.0784,
0.8225,
0.2921,
0.1539
]
},
{
"id": 4,
"class_label": "bicycle",
"position": "top-right",
"bbox": [
0.7853,
0.1297,
0.0847,
0.0804
]
},
{
"id": 5,
"class_label": "truck",
"position": "bottom-right",
"bbox": [
0.7877,
0.8386,
0.1764,
0.119
]
},
{
"id": 6,
"class_label": "bicycle",
"position": "bottom-right",
"bbox": [
0.7975,
0.7614,
0.0887,
0.0731
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.7541,
0.3326,
0.1543,
0.1474
],
"class_label": "car"
},
{
"id": 1,
"bbox": [
0.6763,
0.4525,
0.2553,
0.3423
],
"class_label": "building"
},
{
"id": 2,
"bbox": [
0.1654,
0.3879,
0.1021,
0.1011
],
"class_label": "car"
},
{
"id": 3,
"bbox": [
0.0784,
0.8225,
0.2921,
0.1539
],
"class_label": "truck"
},
{
"id": 4,
"bbox": [
0.7853,
0.1297,
0.0847,
0.0804
],
"class_label": "bicycle"
},
{
"id": 5,
"bbox": [
0.7877,
0.8386,
0.1764,
0.119
],
"class_label": "truck"
},
{
"id": 6,
"bbox": [
0.7975,
0.7614,
0.0887,
0.0731
],
"class_label": "bicycle"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2028
},
{
"scene_id": "fix_classes_sample_029",
"scene_type": "residential_area",
"scene_description": "A quiet residential neighborhood with houses, trees, and occasional pedestrians. The scene contains 7 objects: a tree at top-right (bbox: x=0.73, y=0.05, w=0.15, h=0.32); a person at middle-right (bbox: x=0.85, y=0.50, w=0.08, h=0.18); a car at bottom-center (bbox: x=0.27, y=0.84, w=0.18, h=0.10); a car at top-right (bbox: x=0.64, y=0.20, w=0.13, h=0.12); a building at bottom-left (bbox: x=0.13, y=0.74, w=0.21, h=0.26); a bench at center (bbox: x=0.32, y=0.39, w=0.12, h=0.05); a car at bottom-center (bbox: x=0.54, y=0.78, w=0.16, h=0.15).",
"objects": [
{
"id": 0,
"class_label": "tree",
"position": "top-right",
"bbox": [
0.7292,
0.0461,
0.1496,
0.3199
]
},
{
"id": 1,
"class_label": "person",
"position": "middle-right",
"bbox": [
0.8466,
0.5028,
0.0772,
0.1796
]
},
{
"id": 2,
"class_label": "car",
"position": "bottom-center",
"bbox": [
0.2694,
0.8382,
0.1797,
0.0978
]
},
{
"id": 3,
"class_label": "car",
"position": "top-right",
"bbox": [
0.6393,
0.204,
0.1292,
0.1201
]
},
{
"id": 4,
"class_label": "building",
"position": "bottom-left",
"bbox": [
0.1285,
0.7366,
0.2068,
0.2634
]
},
{
"id": 5,
"class_label": "bench",
"position": "center",
"bbox": [
0.32,
0.3899,
0.1224,
0.0522
]
},
{
"id": 6,
"class_label": "car",
"position": "bottom-center",
"bbox": [
0.5395,
0.784,
0.1562,
0.1461
]
}
],
"gold_annotations": [
{
"id": 0,
"bbox": [
0.7292,
0.0461,
0.1496,
0.3199
],
"class_label": "tree"
},
{
"id": 1,
"bbox": [
0.8466,
0.5028,
0.0772,
0.1796
],
"class_label": "person"
},
{
"id": 2,
"bbox": [
0.2694,
0.8382,
0.1797,
0.0978
],
"class_label": "car"
},
{
"id": 3,
"bbox": [
0.6393,
0.204,
0.1292,
0.1201
],
"class_label": "car"
},
{
"id": 4,
"bbox": [
0.1285,
0.7366,
0.2068,
0.2634
],
"class_label": "building"
},
{
"id": 5,
"bbox": [
0.32,
0.3899,
0.1224,
0.0522
],
"class_label": "bench"
},
{
"id": 6,
"bbox": [
0.5395,
0.784,
0.1562,
0.1461
],
"class_label": "car"
}
],
"task_id": "fix_classes",
"difficulty": "medium",
"seed": 2029
}
]