diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..d86d2111d07c3178d0ecb1c82b02b4059c3a01e1 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,285 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/ball_eating_task/ball_eating_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_eating_task/ball_eating_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_eating_task/ball_eating_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ballcolor_task/ballcolor_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ballcolor_task/ballcolor_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ballcolor_task/ballcolor_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/bfs_task/bfs_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/bfs_task/bfs_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/bfs_task/bfs_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/bookshelf_task/bookshelf_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/bookshelf_task/bookshelf_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/bookshelf_task/bookshelf_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/clock_task/clock_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/clock_task/clock_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/clock_task/clock_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_addition_task/color_addition_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_addition_task/color_addition_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_addition_task/color_addition_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_mixing_task/color_mixing_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/color_mixing_task/color_mixing_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_mixing_task/color_mixing_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/counting_objects_task/counting_objects_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/counting_objects_task/counting_objects_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/counting_objects_task/counting_objects_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_shift_task/grid_shift_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_shift_task/grid_shift_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_shift_task/grid_shift_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000000/final_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000000/first_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000001/final_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000001/first_frame.png filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/homography_task/homography_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000002/final_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000002/first_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/homography_task/homography_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_objects_task/identify_objects_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_objects_task/identify_objects_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_objects_task/identify_objects_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/final_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/final_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/final_frame.png filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/majority_color_task/majority_color_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/majority_color_task/majority_color_00000001/ground_truth.mp4 
filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/majority_color_task/majority_color_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/object_packing_task/object_packing_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/object_packing_task/object_packing_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/object_packing_task/object_packing_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/resize_object_task/resize_object_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/resize_object_task/resize_object_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/resize_object_task/resize_object_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rotation_task/rotation_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rotation_task/rotation_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/rotation_task/rotation_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/ground_truth.mp4 filter=lfs diff=lfs 
merge=lfs -text +VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/ground_truth.mp4 
filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/stable_sort_task/stable_sort_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/stable_sort_task/stable_sort_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/stable_sort_task/stable_sort_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text +VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text 
+VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/ground_truth.mp4 filter=lfs diff=lfs merge=lfs -text diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/final_frame.png b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4a6d2bb9d81542792d19c5514d62d7419a029728 Binary files /dev/null and b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/final_frame.png differ diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/first_frame.png b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f3d40b24e13e7ecb4638249d2a0462fd9d6d817d Binary files /dev/null and b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/first_frame.png differ diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/ground_truth.mp4 b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..efc16179b5419237d46c55cfee8e9023680215d2 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6198704650ad627984fdf081cd511a79dace47914f710a6680326fa9efac921d +size 330432 diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/metadata.json b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..baaa06cc54dea8a0318d61f392a69a51a6ebbc06 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/metadata.json @@ -0,0 +1,210 @@ 
+{ + "task_id": "O-6_animal_color_sorting_00000000", + "generator": "O-6_animal_color_sorting", + "timestamp": "2026-02-17T08:06:33.441436", + "parameters": { + "num_colors": 3, + "animals_per_color": 2, + "animal_size": 35, + "animals": [ + { + "symbol": "animal_0", + "index": 0, + "id": "pink_cat_0", + "type": "cat", + "color_name": "pink", + "color_rgb": [ + 255, + 105, + 180 + ], + "size": 35, + "initial_center": [ + 412, + 223 + ], + "target_center": [ + 186, + 914 + ] + }, + { + "symbol": "animal_1", + "index": 1, + "id": "green_fox_1", + "type": "fox", + "color_name": "green", + "color_rgb": [ + 60, + 180, + 60 + ], + "size": 35, + "initial_center": [ + 392, + 462 + ], + "target_center": [ + 768, + 914 + ] + }, + { + "symbol": "animal_2", + "index": 2, + "id": "yellow_dog_0", + "type": "dog", + "color_name": "yellow", + "color_rgb": [ + 240, + 200, + 0 + ], + "size": 35, + "initial_center": [ + 687, + 562 + ], + "target_center": [ + 477, + 914 + ] + }, + { + "symbol": "animal_3", + "index": 3, + "id": "pink_bear_1", + "type": "bear", + "color_name": "pink", + "color_rgb": [ + 255, + 105, + 180 + ], + "size": 35, + "initial_center": [ + 703, + 169 + ], + "target_center": [ + 256, + 914 + ] + }, + { + "symbol": "animal_4", + "index": 4, + "id": "yellow_rabbit_1", + "type": "rabbit", + "color_name": "yellow", + "color_rgb": [ + 240, + 200, + 0 + ], + "size": 35, + "initial_center": [ + 965, + 183 + ], + "target_center": [ + 547, + 914 + ] + }, + { + "symbol": "animal_5", + "index": 5, + "id": "green_panda_0", + "type": "panda", + "color_name": "green", + "color_rgb": [ + 60, + 180, + 60 + ], + "size": 35, + "initial_center": [ + 75, + 157 + ], + "target_center": [ + 838, + 914 + ] + } + ], + "containers": [ + { + "symbol": "container_0", + "index": 0, + "color_name": "pink", + "color_rgb": [ + 255, + 105, + 180 + ], + "rect": [ + 151, + 874, + 140, + 120 + ], + "center": [ + 221, + 934 + ] + }, + { + "symbol": "container_1", + "index": 1, + "color_name": 
"yellow", + "color_rgb": [ + 240, + 200, + 0 + ], + "rect": [ + 442, + 874, + 140, + 120 + ], + "center": [ + 512, + 934 + ] + }, + { + "symbol": "container_2", + "index": 2, + "color_name": "green", + "color_rgb": [ + 60, + 180, + 60 + ], + "rect": [ + 733, + 874, + 140, + 120 + ], + "center": [ + 803, + 934 + ] + } + ] + }, + "param_hash": "cefa346f8df64ca0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/prompt.txt b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c37e147c4e187416654e751dae44c3a32960f139 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000000/prompt.txt @@ -0,0 +1 @@ +Colored animal faces are scattered at the top of the canvas, and containers with colored borders are at the bottom. Sort each animal into the container with the matching border color. 
\ No newline at end of file diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/final_frame.png b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..27b640e3504e1c166e3b577ed885e020ce69e1cd Binary files /dev/null and b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/final_frame.png differ diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/first_frame.png b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..104818c916b30e2fb50e395bd50dec4056a7dbfe Binary files /dev/null and b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/first_frame.png differ diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/ground_truth.mp4 b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..014404b9f5311b56a58b12092def53467f798cd7 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9743050e17f19d9666fbd9de83ebd33b4620831b081338d809a425b7b392fb8f +size 296716 diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/metadata.json b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0d9e5c7845926eda086d77ed132c6b06981422d7 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/metadata.json @@ -0,0 +1,210 @@ +{ + "task_id": "O-6_animal_color_sorting_00000001", + "generator": 
"O-6_animal_color_sorting", + "timestamp": "2026-02-17T08:06:33.890534", + "parameters": { + "num_colors": 3, + "animals_per_color": 2, + "animal_size": 35, + "animals": [ + { + "symbol": "animal_0", + "index": 0, + "id": "green_fox_0", + "type": "fox", + "color_name": "green", + "color_rgb": [ + 60, + 180, + 60 + ], + "size": 35, + "initial_center": [ + 388, + 587 + ], + "target_center": [ + 186, + 914 + ] + }, + { + "symbol": "animal_1", + "index": 1, + "id": "navy_rabbit_0", + "type": "rabbit", + "color_name": "navy", + "color_rgb": [ + 60, + 80, + 180 + ], + "size": 35, + "initial_center": [ + 614, + 177 + ], + "target_center": [ + 768, + 914 + ] + }, + { + "symbol": "animal_2", + "index": 2, + "id": "navy_panda_1", + "type": "panda", + "color_name": "navy", + "color_rgb": [ + 60, + 80, + 180 + ], + "size": 35, + "initial_center": [ + 170, + 73 + ], + "target_center": [ + 838, + 914 + ] + }, + { + "symbol": "animal_3", + "index": 3, + "id": "purple_bear_0", + "type": "bear", + "color_name": "purple", + "color_rgb": [ + 150, + 80, + 200 + ], + "size": 35, + "initial_center": [ + 559, + 404 + ], + "target_center": [ + 477, + 914 + ] + }, + { + "symbol": "animal_4", + "index": 4, + "id": "green_dog_1", + "type": "dog", + "color_name": "green", + "color_rgb": [ + 60, + 180, + 60 + ], + "size": 35, + "initial_center": [ + 785, + 430 + ], + "target_center": [ + 256, + 914 + ] + }, + { + "symbol": "animal_5", + "index": 5, + "id": "purple_cat_1", + "type": "cat", + "color_name": "purple", + "color_rgb": [ + 150, + 80, + 200 + ], + "size": 35, + "initial_center": [ + 838, + 70 + ], + "target_center": [ + 547, + 914 + ] + } + ], + "containers": [ + { + "symbol": "container_0", + "index": 0, + "color_name": "green", + "color_rgb": [ + 60, + 180, + 60 + ], + "rect": [ + 151, + 874, + 140, + 120 + ], + "center": [ + 221, + 934 + ] + }, + { + "symbol": "container_1", + "index": 1, + "color_name": "purple", + "color_rgb": [ + 150, + 80, + 200 + ], + "rect": [ + 442, + 874, + 
140, + 120 + ], + "center": [ + 512, + 934 + ] + }, + { + "symbol": "container_2", + "index": 2, + "color_name": "navy", + "color_rgb": [ + 60, + 80, + 180 + ], + "rect": [ + 733, + 874, + 140, + 120 + ], + "center": [ + 803, + 934 + ] + } + ] + }, + "param_hash": "d027005fcfa1265b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/prompt.txt b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c37e147c4e187416654e751dae44c3a32960f139 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000001/prompt.txt @@ -0,0 +1 @@ +Colored animal faces are scattered at the top of the canvas, and containers with colored borders are at the bottom. Sort each animal into the container with the matching border color. 
\ No newline at end of file diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/final_frame.png b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..44364cfa30952cc40039d0ce2f21bfc463f00d2d Binary files /dev/null and b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/final_frame.png differ diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/first_frame.png b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..85609742ffd66172f9a1d664afcd607678eb733d Binary files /dev/null and b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/first_frame.png differ diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/ground_truth.mp4 b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a95c277ab5ab9f746ffe04d7e234d82a129354b7 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a76ce4503df46547442663f92e663fc00959bb5ee00d83d63c6a24426835b1cb +size 279406 diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/metadata.json b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..e4de898f62621e60b2f82c51d13139ff2927c139 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/metadata.json @@ -0,0 +1,210 @@ +{ + "task_id": "O-6_animal_color_sorting_00000002", + "generator": 
"O-6_animal_color_sorting", + "timestamp": "2026-02-17T08:06:34.290245", + "parameters": { + "num_colors": 3, + "animals_per_color": 2, + "animal_size": 35, + "animals": [ + { + "symbol": "animal_0", + "index": 0, + "id": "coral_cat_0", + "type": "cat", + "color_name": "coral", + "color_rgb": [ + 255, + 127, + 80 + ], + "size": 35, + "initial_center": [ + 542, + 496 + ], + "target_center": [ + 768, + 914 + ] + }, + { + "symbol": "animal_1", + "index": 1, + "id": "brown_dog_1", + "type": "dog", + "color_name": "brown", + "color_rgb": [ + 165, + 90, + 50 + ], + "size": 35, + "initial_center": [ + 334, + 393 + ], + "target_center": [ + 186, + 914 + ] + }, + { + "symbol": "animal_2", + "index": 2, + "id": "pink_rabbit_0", + "type": "rabbit", + "color_name": "pink", + "color_rgb": [ + 255, + 105, + 180 + ], + "size": 35, + "initial_center": [ + 917, + 626 + ], + "target_center": [ + 477, + 914 + ] + }, + { + "symbol": "animal_3", + "index": 3, + "id": "pink_panda_1", + "type": "panda", + "color_name": "pink", + "color_rgb": [ + 255, + 105, + 180 + ], + "size": 35, + "initial_center": [ + 562, + 179 + ], + "target_center": [ + 547, + 914 + ] + }, + { + "symbol": "animal_4", + "index": 4, + "id": "brown_fox_0", + "type": "fox", + "color_name": "brown", + "color_rgb": [ + 165, + 90, + 50 + ], + "size": 35, + "initial_center": [ + 687, + 666 + ], + "target_center": [ + 256, + 914 + ] + }, + { + "symbol": "animal_5", + "index": 5, + "id": "coral_bear_1", + "type": "bear", + "color_name": "coral", + "color_rgb": [ + 255, + 127, + 80 + ], + "size": 35, + "initial_center": [ + 854, + 254 + ], + "target_center": [ + 838, + 914 + ] + } + ], + "containers": [ + { + "symbol": "container_0", + "index": 0, + "color_name": "brown", + "color_rgb": [ + 165, + 90, + 50 + ], + "rect": [ + 151, + 874, + 140, + 120 + ], + "center": [ + 221, + 934 + ] + }, + { + "symbol": "container_1", + "index": 1, + "color_name": "pink", + "color_rgb": [ + 255, + 105, + 180 + ], + "rect": [ + 442, + 874, 
+ 140, + 120 + ], + "center": [ + 512, + 934 + ] + }, + { + "symbol": "container_2", + "index": 2, + "color_name": "coral", + "color_rgb": [ + 255, + 127, + 80 + ], + "rect": [ + 733, + 874, + 140, + 120 + ], + "center": [ + 803, + 934 + ] + } + ] + }, + "param_hash": "5dbea7c160c50f62", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/prompt.txt b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c37e147c4e187416654e751dae44c3a32960f139 --- /dev/null +++ b/VBVR-Dataset/O-6_animal_color_sorting_task/O-6_animal_color_sorting_00000002/prompt.txt @@ -0,0 +1 @@ +Colored animal faces are scattered at the top of the canvas, and containers with colored borders are at the bottom. Sort each animal into the container with the matching border color. 
\ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/final_frame.png b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c183efe756d9c8d7a5e04bc866bd23765d715fb6 Binary files /dev/null and b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/final_frame.png differ diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/first_frame.png b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6d7730752c81faf387174a4586e801d92b4085d6 Binary files /dev/null and b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/first_frame.png differ diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/ground_truth.mp4 b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..527d841ace12cb2877bf46749065e873e8d4bb8c --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c84c6f21ef8cfa8d5fb8ca057defe7ed2b79ad8df3598d4f5d3ffe97d6ff69 +size 154921 diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/metadata.json b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1f4f2c9dd99d581f560b238d574391bf5d0bc5e6 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/metadata.json @@ -0,0 +1,50 @@ +{ + "task_id": "attention_shift_different_00000000", + 
"generator": "attention_shift_different", + "timestamp": "2026-02-17T07:25:38.230177", + "parameters": { + "objects": [ + { + "shape": "hexagon", + "color": [ + 68, + 220, + 192 + ], + "size": 110, + "angle": -23, + "center": [ + 247.864022, + 512.0 + ] + }, + { + "shape": "triangle", + "color": [ + 163, + 140, + 93 + ], + "size": 166, + "angle": 3, + "center": [ + 764.446601, + 512.0 + ] + } + ], + "start_index": 0, + "end_index": 1, + "direction": "left_to_right" + }, + "param_hash": "b104eed1057f500e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/prompt.txt b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0726d84d7e1f3ccdea3524e7549bf20feca8a479 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows two objects, one on the left and one on the right, with a green attention box around the left object. The objects remain stationary and unchanged throughout. Move the green attention box from the left object to the right object. 
\ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/final_frame.png b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..841c11473bacf7cd3e137712eecd0c14e776b4ad Binary files /dev/null and b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/final_frame.png differ diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/first_frame.png b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..789d3272b75ce69ce6d82d622080dd6e6fc802cd Binary files /dev/null and b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/first_frame.png differ diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/ground_truth.mp4 b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6353de6dcb3cab72b2d484e053c8bd9aafdb43b5 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035a60637d6a1414dc002d5fe99ad6b12836b2387698d86155689eebef8a8ecf +size 177506 diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/metadata.json b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d6158404e6c0cb076f071b564f8e3e2e7e96e054 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/metadata.json @@ -0,0 +1,50 @@ +{ + "task_id": "attention_shift_different_00000001", + 
"generator": "attention_shift_different", + "timestamp": "2026-02-17T07:25:38.618957", + "parameters": { + "objects": [ + { + "shape": "triangle", + "color": [ + 93, + 140, + 134 + ], + "size": 163, + "angle": -33, + "center": [ + 264.082868, + 512.0 + ] + }, + { + "shape": "triangle", + "color": [ + 233, + 231, + 145 + ], + "size": 151, + "angle": 18, + "center": [ + 766.712906, + 512.0 + ] + } + ], + "start_index": 1, + "end_index": 0, + "direction": "right_to_left" + }, + "param_hash": "68df91201c2e10ec", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/prompt.txt b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a13f0b56b5cc81266a1692644ac3bba42b1c4177 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows two objects, one on the left and one on the right, with a green attention box around the right object. The objects remain stationary and unchanged throughout. Move the green attention box from the right object to the left object. 
\ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/final_frame.png b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..eaac498f0e5e3d51c556c907f1b079f17e14eb48 Binary files /dev/null and b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/final_frame.png differ diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/first_frame.png b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f990750603b8723dcde237da1b044aa551c3220b Binary files /dev/null and b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/first_frame.png differ diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/ground_truth.mp4 b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cd802cf4675cb48daf6af5527600109f551cb548 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6fef7f0589c2164b6a99032800278a14a42612a8d745e04586faca040b2a9d +size 168285 diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/metadata.json b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..258e3712664efa47dd7ae8d434d299e1ca4f95a2 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/metadata.json @@ -0,0 +1,50 @@ +{ + "task_id": "attention_shift_different_00000002", + 
"generator": "attention_shift_different", + "timestamp": "2026-02-17T07:25:39.002384", + "parameters": { + "objects": [ + { + "shape": "hexagon", + "color": [ + 247, + 55, + 191 + ], + "size": 128, + "angle": 9, + "center": [ + 279.338095, + 512.0 + ] + }, + { + "shape": "circle", + "color": [ + 174, + 105, + 128 + ], + "size": 99, + "angle": -33, + "center": [ + 740.211457, + 512.0 + ] + } + ], + "start_index": 1, + "end_index": 0, + "direction": "right_to_left" + }, + "param_hash": "1e1a086b19490ccd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/prompt.txt b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a13f0b56b5cc81266a1692644ac3bba42b1c4177 --- /dev/null +++ b/VBVR-Dataset/attention_shift_different_task/attention_shift_different_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows two objects, one on the left and one on the right, with a green attention box around the right object. The objects remain stationary and unchanged throughout. Move the green attention box from the right object to the left object. 
\ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/final_frame.png b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..caad206263cdad716a6ae82e006d27e92c25d560 Binary files /dev/null and b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/final_frame.png differ diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/first_frame.png b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..735fa9ca5a497941988b4b542c93ce49a2021ef5 Binary files /dev/null and b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/first_frame.png differ diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/ground_truth.mp4 b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0c434d81944d7ee5aa73ea8846535509aae0bb2e --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0675f1526006225705b3d93569d1cfe4a6739fcca53518344707b4fa60a45488 +size 200428 diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/metadata.json b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..11bdcd701e84fbf8ac7f1c825b57fa72c82fc1e2 --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/metadata.json @@ -0,0 +1,26 @@ +{ + "task_id": "attention_shift_same_00000000", + "generator": "attention_shift_same", + "timestamp": "2026-02-17T07:14:26.074360", + "parameters": { + "shape": "square", + 
"color": [ + 240, + 200, + 100 + ], + "size": 74, + "angle": 25, + "direction": "right_to_left" + }, + "param_hash": "e186f1c0fa466eb2", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/prompt.txt b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..74ff53a7ce40dfde7e5bc2838e8dd183548b2ede --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows two identical square objects, one on the left and one on the right, with a green attention box around the right object. The square objects remain stationary and unchanged throughout. Move the green attention box from the right object to the left object. \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/final_frame.png b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c05cf7386148bc3d380a7696c29e3db37686232a Binary files /dev/null and b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/final_frame.png differ diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/first_frame.png b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7e59725cd1c2d523fd2ffa80be1cb478b5fa8e47 Binary files /dev/null and b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/first_frame.png differ diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/ground_truth.mp4 
b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0c811677d645498172bc5c64b0fa3629fca58fc1 --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45288e8aee2f9759f585de7c7c4b71fdb943befb364c1888f734d234322ab59c +size 135672 diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/metadata.json b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b5c82572c83622eb10d3c1f56856d12edcd1adee --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/metadata.json @@ -0,0 +1,26 @@ +{ + "task_id": "attention_shift_same_00000001", + "generator": "attention_shift_same", + "timestamp": "2026-02-17T07:14:26.427028", + "parameters": { + "shape": "diamond", + "color": [ + 100, + 200, + 150 + ], + "size": 80, + "angle": 0, + "direction": "right_to_left" + }, + "param_hash": "b0997df8e575a34e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/prompt.txt b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d201418356b30c3e9e042fe22ed1597638be4233 --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows two identical diamond objects, one on the left and one on the right, with a green attention box around the right object. The diamond objects remain stationary and unchanged throughout. 
Move the green attention box from the right object to the left object. \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/final_frame.png b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f942aae354e73ac87f195e2aff7a1ff6852905ed Binary files /dev/null and b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/final_frame.png differ diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/first_frame.png b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..84e26b1d4b87e2f89449d02f6a2156277de8b833 Binary files /dev/null and b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/first_frame.png differ diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/ground_truth.mp4 b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..16c2b6994abf29e99ca7f41a1c8c1cafeb18e2a7 --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b252c4aa4d4a6effb484d8917ed49d780e90ea34162580a6e90b4843d2c66ec4 +size 154041 diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/metadata.json b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1cf5f3bc5bdf9556225669af5e1ed67149962147 --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/metadata.json @@ -0,0 +1,26 @@ +{ + "task_id": "attention_shift_same_00000002", + "generator": "attention_shift_same", + "timestamp": 
"2026-02-17T07:14:31.093731", + "parameters": { + "shape": "hexagon", + "color": [ + 120, + 255, + 255 + ], + "size": 87, + "angle": 5, + "direction": "left_to_right" + }, + "param_hash": "dcf71903e3e64a6d", + "generation": { + "seed": 1438678513, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/prompt.txt b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..beb163559788f4ed40834fade3ab0bf0e27faee2 --- /dev/null +++ b/VBVR-Dataset/attention_shift_same_task/attention_shift_same_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows two identical hexagon objects, one on the left and one on the right, with a green attention box around the left object. The hexagon objects remain stationary and unchanged throughout. Move the green attention box from the left object to the right object. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/final_frame.png b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d3fc0c7d4602af13cfdc24c5bb8a24498f18df40 Binary files /dev/null and b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/final_frame.png differ diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/first_frame.png b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3c3deecd166d02c3d70d7289810a562e1745eb3b Binary files /dev/null and b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/first_frame.png differ diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/ground_truth.mp4 b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7b54b2f3863645a4456fd2e3b650ca9ed0ac0b73 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36f8d59821b3181f41446a022e7be990e0ceb4a8a305fd2a441f72f3a9ca926 +size 278432 diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/metadata.json b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f8e38ba6080ad64152ea87f3198ef9c8c40dedfa --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "ball_bounces_given_time_00000000", + "generator": "ball_bounces_given_time", + 
"timestamp": "2026-02-17T07:39:08.306875", + "parameters": { + "num_bounces": 4, + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 747.100549, + 804.89009 + ], + "final_center": [ + 871.196665, + 90 + ], + "color": [ + 255, + 192, + 203 + ], + "radius": 30, + "direction": -2.110163 + } + ] + }, + "param_hash": "e9c05fc61e332a54", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/prompt.txt b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a1e79ac6c723c5804d1f583c498826aadf42ba20 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000000/prompt.txt @@ -0,0 +1 @@ +A ball is placed at the initial position with a direction arrow indicating its movement direction. Simulate the ball bouncing 4 times off the boundary walls following elastic collision physics (angle of incidence equals angle of reflection). The ball stops after the 4th bounce, with its final position at the wall where the last collision occurs. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/final_frame.png b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..882cf7bcabc3058ba2bb230adcd34f6fc5c131b0 Binary files /dev/null and b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/final_frame.png differ diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/first_frame.png b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2b5adac8e680e9198ab8dce1e2c1f8dc2ac7138e Binary files /dev/null and b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/first_frame.png differ diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/ground_truth.mp4 b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..733f3ca1dc4d55ea7af68c586fbdea148097b341 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e42ae08b8ae96f2ee77f8f1a3ec0df9f331dc3b04dc18f0ce760be85adfccb +size 332786 diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/metadata.json b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f4eacfce94489fcd2dd7519af114b1e22de6d271 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "ball_bounces_given_time_00000001", + "generator": "ball_bounces_given_time", + 
"timestamp": "2026-02-17T07:39:09.187593", + "parameters": { + "num_bounces": 6, + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 465.444301, + 232.966867 + ], + "final_center": [ + 934, + 452.863245 + ], + "color": [ + 128, + 128, + 0 + ], + "radius": 30, + "direction": -0.130819 + } + ] + }, + "param_hash": "2d3352b060cabb8e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/prompt.txt b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e04ca305e5ae66ddfebcf4c962fe9c904af6c2f --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000001/prompt.txt @@ -0,0 +1 @@ +A ball is placed at the initial position with a direction arrow indicating its movement direction. Simulate the ball bouncing 6 times off the boundary walls following elastic collision physics (angle of incidence equals angle of reflection). The ball stops after the 6th bounce, with its final position at the wall where the last collision occurs. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/final_frame.png b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d12f283939052afd607c9ecca58771758655da0e Binary files /dev/null and b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/final_frame.png differ diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/first_frame.png b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3a6c46de22e3a59b220aa48586b06538ee43c681 Binary files /dev/null and b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/first_frame.png differ diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/ground_truth.mp4 b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d38501048350cc1ac9ae118c3e015075fbcbb095 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce362acc0970e682f648c0631515372e8ad28cfc15e2caa010afb77761d5ad0 +size 219931 diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/metadata.json b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..948e03d92a9e63a94c845716c7d7c17742303b15 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "ball_bounces_given_time_00000002", + "generator": "ball_bounces_given_time", + 
"timestamp": "2026-02-17T07:39:09.833675", + "parameters": { + "num_bounces": 2, + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 607.634246, + 354.401745 + ], + "final_center": [ + 924.644085, + 90 + ], + "color": [ + 210, + 105, + 30 + ], + "radius": 30, + "direction": -0.667111 + } + ] + }, + "param_hash": "bd06cd7ff578c4db", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/prompt.txt b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..437ad28c7420ab4f1d0ddad50e120f76385ee8b9 --- /dev/null +++ b/VBVR-Dataset/ball_bounces_given_time_task/ball_bounces_given_time_00000002/prompt.txt @@ -0,0 +1 @@ +A ball is placed at the initial position with a direction arrow indicating its movement direction. Simulate the ball bouncing 2 times off the boundary walls following elastic collision physics (angle of incidence equals angle of reflection). The ball stops after the 2nd bounce, with its final position at the wall where the last collision occurs. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000000/final_frame.png b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ca98ba5c4b0f492f57ce860a18ec0dc65712fb79 Binary files /dev/null and b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/final_frame.png differ diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000000/first_frame.png b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..452b8e2e7573f918800217e4a436bc01e6b21730 Binary files /dev/null and b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/first_frame.png differ diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000000/ground_truth.mp4 b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..49dd627a6eff910f40c2c22c6e6e6b821c0f5d61 --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af871a1aa79b2849488fd3d3a946c93968dcd2e77ca1577839e5cfbe5d05a66d +size 412719 diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000000/metadata.json b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4b54201d7b72d4afae7b12a2eb6b6000cdf407fd --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/metadata.json @@ -0,0 +1,98 @@ +{ + "task_id": "ball_eating_00000000", + "generator": "ball_eating", + "timestamp": "2026-02-17T07:47:17.949923", + "parameters": { + "growth_factor": 1.5, + "eating_sequence": [ + 0, + 1, + 2 + ], + "objects": [ + { + "symbol": "ball", + "type": "predator", + "color": [ + 0, + 0, + 0 + ], + "initial_size": 84.27, + "initial_center": [ + 742.95, + 461.27 + ], + "final_size": 284.41, + 
"final_center": [ + 201.39, + 316.16 + ] + }, + { + "symbol": "ball", + "type": "prey", + "id": 0, + "color": [ + 70, + 130, + 180 + ], + "color_name": "blue", + "size": 53.8, + "center": [ + 197.86, + 141.03 + ], + "is_eaten": true, + "eaten_order": 0 + }, + { + "symbol": "ball", + "type": "prey", + "id": 1, + "color": [ + 60, + 179, + 113 + ], + "color_name": "green", + "size": 115.33, + "center": [ + 937.83, + 621.26 + ], + "is_eaten": true, + "eaten_order": 1 + }, + { + "symbol": "ball", + "type": "prey", + "id": 2, + "color": [ + 255, + 215, + 0 + ], + "color_name": "yellow", + "size": 143.33, + "center": [ + 201.39, + 316.16 + ], + "is_eaten": true, + "eaten_order": 2 + } + ] + }, + "param_hash": "8077a14ace446824", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000000/prompt.txt b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..22e2c0a4fac2515292ba01e87e6fd3292dfd8063 --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000000/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a black ball and several colored balls of different sizes. The black ball can eat balls that are smaller than itself. After eating a ball, the black ball grows larger. Find the correct sequence to eat all colored balls step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000001/final_frame.png b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f9a8a3030f8ae8f109b589c2388fdc84b51ee795 Binary files /dev/null and b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/final_frame.png differ diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000001/first_frame.png b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..436e1d04c149dd54c548473bd713c9487b5f1c4e Binary files /dev/null and b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/first_frame.png differ diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000001/ground_truth.mp4 b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f6685f0a2d2bf04de6894bfb20d38945769c6f0d --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207b2fdfac3d2a8701f1afce965f30100fe1367828bc5b3a2c5955af1930f07a +size 211697 diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000001/metadata.json b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..99e9da5a028d518e17b8d68d21411c27c7d1bc30 --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "ball_eating_00000001", + "generator": "ball_eating", + "timestamp": "2026-02-17T07:47:18.902612", + "parameters": { + "growth_factor": 1.5, + "eating_sequence": [ + 0, + 1 + ], + "objects": [ + { + "symbol": "ball", + "type": "predator", + "color": [ + 0, + 0, + 0 + ], + "initial_size": 64.2, + "initial_center": [ + 270.4, + 650.94 + ], + "final_size": 144.46, + 
"final_center": [ + 238.44, + 371.7 + ] + }, + { + "symbol": "ball", + "type": "prey", + "id": 0, + "color": [ + 255, + 140, + 0 + ], + "color_name": "orange", + "size": 57.03, + "center": [ + 354.89, + 586.39 + ], + "is_eaten": true, + "eaten_order": 0 + }, + { + "symbol": "ball", + "type": "prey", + "id": 1, + "color": [ + 220, + 20, + 60 + ], + "color_name": "red", + "size": 73.47, + "center": [ + 238.44, + 371.7 + ], + "is_eaten": true, + "eaten_order": 1 + } + ] + }, + "param_hash": "98299bfd50bf7375", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000001/prompt.txt b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..22e2c0a4fac2515292ba01e87e6fd3292dfd8063 --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000001/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a black ball and several colored balls of different sizes. The black ball can eat balls that are smaller than itself. After eating a ball, the black ball grows larger. Find the correct sequence to eat all colored balls step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000002/final_frame.png b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e7364738d7f063c0262229a0873045438eb3867d Binary files /dev/null and b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/final_frame.png differ diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000002/first_frame.png b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6cc07076877dae1286c1bfbae12825b3c6060bf1 Binary files /dev/null and b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/first_frame.png differ diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000002/ground_truth.mp4 b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..441a3c45da20d0a784403cd00b05809af94fb4d9 --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce0377e985b12b7ae2211dfed4cf80ccc395fae32a061252d50e998b4ba3921 +size 255991 diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000002/metadata.json b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dc1f33a21f9c74ebae17360f0722939829ec449c --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/metadata.json @@ -0,0 +1,98 @@ +{ + "task_id": "ball_eating_00000002", + "generator": "ball_eating", + "timestamp": "2026-02-17T07:47:19.817383", + "parameters": { + "growth_factor": 1.5, + "eating_sequence": [ + 0, + 1, + 2 + ], + "objects": [ + { + "symbol": "ball", + "type": "predator", + "color": [ + 0, + 0, + 0 + ], + "initial_size": 51.7, + "initial_center": [ + 435.98, + 719.64 + ], + "final_size": 174.49, + 
"final_center": [ + 780.57, + 509.79 + ] + }, + { + "symbol": "ball", + "type": "prey", + "id": 0, + "color": [ + 255, + 215, + 0 + ], + "color_name": "yellow", + "size": 45.13, + "center": [ + 712.48, + 691.74 + ], + "is_eaten": true, + "eaten_order": 0 + }, + { + "symbol": "ball", + "type": "prey", + "id": 1, + "color": [ + 147, + 112, + 219 + ], + "color_name": "purple", + "size": 71.68, + "center": [ + 586.28, + 619.83 + ], + "is_eaten": true, + "eaten_order": 1 + }, + { + "symbol": "ball", + "type": "prey", + "id": 2, + "color": [ + 255, + 215, + 0 + ], + "color_name": "yellow", + "size": 104.69, + "center": [ + 780.57, + 509.79 + ], + "is_eaten": true, + "eaten_order": 2 + } + ] + }, + "param_hash": "07b3dcba76982689", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_eating_task/ball_eating_00000002/prompt.txt b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..22e2c0a4fac2515292ba01e87e6fd3292dfd8063 --- /dev/null +++ b/VBVR-Dataset/ball_eating_task/ball_eating_00000002/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a black ball and several colored balls of different sizes. The black ball can eat balls that are smaller than itself. After eating a ball, the black ball grows larger. Find the correct sequence to eat all colored balls step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/final_frame.png b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7f0c04c106703a058fbccc2cfa7653c2cd6dd932 Binary files /dev/null and b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/final_frame.png differ diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/first_frame.png b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f125f0448c8fa85531baef2138584d7097d4ae34 Binary files /dev/null and b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/first_frame.png differ diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/ground_truth.mp4 b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cfe2bbeaafb6898645b505554231b070587d838c --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e200f9ac910f3b80dfce814330aa36fbd969c64c197e96f955d12b37c2b10551 +size 286379 diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/metadata.json b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..82f993914f27a5bb345e25204b19fdc097115adc --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/metadata.json @@ -0,0 +1,88 @@ +{ + "task_id": "ball_prediction_00000000", + "generator": "ball_prediction", + "timestamp": "2026-02-17T07:23:23.836952", + "parameters": { + "ball_x": 269, + "ball_y": 230, + "ball_color": [ + 255, + 192, + 203 + ], + "angle": 15.168263, + "circles": [ + { + "id": 1, + "position": [ + 614, + 
256 + ] + }, + { + "id": 2, + "position": [ + 661, + 303 + ] + }, + { + "id": 3, + "position": [ + 708, + 350 + ] + }, + { + "id": 4, + "position": [ + 755, + 397 + ] + }, + { + "id": 5, + "position": [ + 802, + 444 + ] + }, + { + "id": 6, + "position": [ + 849, + 491 + ] + } + ], + "target_circle": 1, + "bounce_points": [ + [ + 269, + 230 + ], + [ + 630.491192, + 132 + ], + [ + 892, + 202.774372 + ], + [ + 614, + 256 + ] + ] + }, + "param_hash": "27c908c4dee2f4ac", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/prompt.txt b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8f5efc24832387bf4a815f2f5af4f9ae75a651c --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a ball with an arrow indicating its initial direction, and several empty target positions (hollow circles) on the right side. Simulate the ball moving along this direction and bouncing off walls following the law of reflection (the angle of reflection equals the angle of incidence). The ball will follow a complete trajectory and eventually align exactly with and completely overlap one of the target positions. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/final_frame.png b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e60f21450cfd6956b498a048f9bcf7959288d664 Binary files /dev/null and b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/final_frame.png differ diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/first_frame.png b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7eb9d08209a2694c0c8683625fb80bf683ff32e8 Binary files /dev/null and b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/first_frame.png differ diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/ground_truth.mp4 b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7d35cdb633e4977d3b3a37aff410873246570cf3 --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1ba03cf33b6c6026a73ea174d4797d67dd19604bd95c8559d9bd828dacbbb4 +size 262571 diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/metadata.json b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..64ab0d41cae2e68120509a2bf979238e8728edf2 --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/metadata.json @@ -0,0 +1,66 @@ +{ + "task_id": "ball_prediction_00000001", + "generator": "ball_prediction", + "timestamp": "2026-02-17T07:23:24.773258", + "parameters": { + "ball_x": 245, + "ball_y": 494, + "ball_color": [ + 128, + 128, + 0 + ], + "angle": 21.857442, + "circles": [ + { + "id": 1, + "position": [ + 614, + 
256 + ] + }, + { + "id": 2, + "position": [ + 661, + 303 + ] + }, + { + "id": 3, + "position": [ + 708, + 350 + ] + }, + { + "id": 4, + "position": [ + 755, + 397 + ] + } + ], + "target_circle": 2, + "bounce_points": [ + [ + 245, + 494 + ], + [ + 661, + 303 + ] + ] + }, + "param_hash": "9325885f51a4470d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/prompt.txt b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8f5efc24832387bf4a815f2f5af4f9ae75a651c --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a ball with an arrow indicating its initial direction, and several empty target positions (hollow circles) on the right side. Simulate the ball moving along this direction and bouncing off walls following the law of reflection (the angle of reflection equals the angle of incidence). The ball will follow a complete trajectory and eventually align exactly with and completely overlap one of the target positions. 
\ No newline at end of file diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/final_frame.png b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..115ea361df7b08343569ef08d5200315875af196 Binary files /dev/null and b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/final_frame.png differ diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/first_frame.png b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4a4cb173acae0406cdd5bc2bcb26cf451755cae5 Binary files /dev/null and b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/first_frame.png differ diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/ground_truth.mp4 b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..39008b4e0107bae77d20bf141372257261eec773 --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265ceb51eb5fd8babd6ee896c15ffdef6bcf7c17bbd8e62a6b809567fb723899 +size 314554 diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/metadata.json b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..05db950dc33d6023890833432416fab06a4bff0e --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "ball_prediction_00000002", + "generator": "ball_prediction", + "timestamp": "2026-02-17T07:23:25.702374", + "parameters": { + "ball_x": 133, + "ball_y": 265, + "ball_color": [ + 72, + 61, + 139 + ], + "angle": 11.709579, + "circles": [ + { + "id": 1, + "position": [ + 614, + 
256 + ] + }, + { + "id": 2, + "position": [ + 661, + 303 + ] + }, + { + "id": 3, + "position": [ + 708, + 350 + ] + }, + { + "id": 4, + "position": [ + 755, + 397 + ] + }, + { + "id": 5, + "position": [ + 802, + 444 + ] + } + ], + "target_circle": 5, + "bounce_points": [ + [ + 133, + 265 + ], + [ + 774.692431, + 132 + ], + [ + 892, + 155.366021 + ], + [ + 132, + 313.875068 + ], + [ + 802, + 444 + ] + ] + }, + "param_hash": "7f01381399618679", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/prompt.txt b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d8f5efc24832387bf4a815f2f5af4f9ae75a651c --- /dev/null +++ b/VBVR-Dataset/ball_prediction_task/ball_prediction_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a ball with an arrow indicating its initial direction, and several empty target positions (hollow circles) on the right side. Simulate the ball moving along this direction and bouncing off walls following the law of reflection (the angle of reflection equals the angle of incidence). The ball will follow a complete trajectory and eventually align exactly with and completely overlap one of the target positions. 
\ No newline at end of file diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000000/._ground_truth.mp4 b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/._ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..00840b599972f36a23233798076291d2371dbc4f Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/._ground_truth.mp4 differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000000/final_frame.png b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2087a7596050b431e18c4fcf403ed109a016e77f Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/final_frame.png differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000000/first_frame.png b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..855550e9bc3aef4bbc644dbb1dd7a55d0f079df1 Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/first_frame.png differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000000/ground_truth.mp4 b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..934ee4101ca7c2af73f440dab92f6719b42deacf --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98e3366f3a16225ff46cfa1459ef20c5817b0feb1efa726ed9120e2d5aae7aff +size 117557 diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000000/metadata.json b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..70ede23b94c65dca42683c70da5d80e4ccc6215f --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "ballcolor_00000000", + "generator": "ballcolor", + "timestamp": 
"2026-02-26T09:54:23.983438", + "parameters": { + "total_count": 6, + "red_cluster_idx": 0, + "merge_sequence": [ + { + "from": 0, + "to": 1, + "from_color": "red", + "to_color": "violet", + "color_after": "red", + "from_size": 4, + "to_size": 2, + "final_size": 6, + "target_id_letter": "B" + } + ], + "objects": [ + { + "symbol": "cluster", + "cluster_id": 0, + "cluster_id_letter": "A", + "color": "red", + "color_rgb": [ + 255, + 50, + 50 + ], + "initial_size": 4, + "initial_center": [ + 631.45, + 157.27 + ], + "final_size": 6, + "final_center": [ + 540.63, + 577.69 + ], + "is_red": true, + "is_absorbed": false, + "ball_radius": 26 + }, + { + "symbol": "cluster", + "cluster_id": 1, + "cluster_id_letter": "B", + "color": "violet", + "color_rgb": [ + 238, + 130, + 238 + ], + "initial_size": 2, + "initial_center": [ + 540.63, + 577.69 + ], + "final_size": 0, + "final_center": null, + "is_red": false, + "is_absorbed": true, + "ball_radius": 26 + } + ] + }, + "param_hash": "bae3f79a19485fe0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000000/prompt.txt b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..74f0498efa722779803e1897390f183d07592593 --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000000/prompt.txt @@ -0,0 +1 @@ +In the scene, there are 2 ball clusters: red cluster A has 4 balls, and there are other clusters with different numbers of balls. The global TOTAL label shows the sum 6. Control the red cluster A to absorb other clusters. You can only absorb clusters that are smaller than the red cluster. Find the correct sequence to absorb all clusters step by step until all balls become red. 
\ No newline at end of file diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000001/final_frame.png b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..abd26c5d2941fa7c5ca59fb0c43ad4b5b69b95b1 Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/final_frame.png differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000001/first_frame.png b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fc3b36b0c643a29c7196069f026690d339652fba Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/first_frame.png differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000001/ground_truth.mp4 b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7d9f49ce4c3449c2271cac3d66c84b250a4c48ed --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:670eab544441df6cabedf6a5d302c514e1c9a57866076e127a4733e887a1565e +size 385189 diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000001/metadata.json b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f983cbcda7b98965e25dedd7473d7f14188e2a8b --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/metadata.json @@ -0,0 +1,111 @@ +{ + "task_id": "ballcolor_00000001", + "generator": "ballcolor", + "timestamp": "2026-02-26T09:54:24.781973", + "parameters": { + "total_count": 20, + "red_cluster_idx": 0, + "merge_sequence": [ + { + "from": 0, + "to": 1, + "from_color": "red", + "to_color": "navy", + "color_after": "red", + "from_size": 9, + "to_size": 3, + "final_size": 12, + "target_id_letter": "B" + }, + { + "from": 0, + "to": 2, + "from_color": "red", + 
"to_color": "turquoise", + "color_after": "red", + "from_size": 12, + "to_size": 8, + "final_size": 20, + "target_id_letter": "C" + } + ], + "objects": [ + { + "symbol": "cluster", + "cluster_id": 0, + "cluster_id_letter": "A", + "color": "red", + "color_rgb": [ + 255, + 50, + 50 + ], + "initial_size": 9, + "initial_center": [ + 857.5, + 138.37 + ], + "final_size": 20, + "final_center": [ + 850.48, + 608.26 + ], + "is_red": true, + "is_absorbed": false, + "ball_radius": 27 + }, + { + "symbol": "cluster", + "cluster_id": 1, + "cluster_id_letter": "B", + "color": "navy", + "color_rgb": [ + 0, + 0, + 128 + ], + "initial_size": 3, + "initial_center": [ + 501.78, + 360.94 + ], + "final_size": 0, + "final_center": null, + "is_red": false, + "is_absorbed": true, + "ball_radius": 27 + }, + { + "symbol": "cluster", + "cluster_id": 2, + "cluster_id_letter": "C", + "color": "turquoise", + "color_rgb": [ + 64, + 224, + 208 + ], + "initial_size": 8, + "initial_center": [ + 850.48, + 608.26 + ], + "final_size": 0, + "final_center": null, + "is_red": false, + "is_absorbed": true, + "ball_radius": 27 + } + ] + }, + "param_hash": "fb18d9c871b60869", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000001/prompt.txt b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f31a48cf2d4387a6679b55e1067b1af1ff4c4fc --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000001/prompt.txt @@ -0,0 +1 @@ +In the scene, there are 3 ball clusters: red cluster A has 9 balls, and there are other clusters with different numbers of balls. The global TOTAL label shows the sum 20. Control the red cluster A to absorb other clusters. You can only absorb clusters that are smaller than the red cluster. 
Find the correct sequence to absorb all clusters step by step until all balls become red. \ No newline at end of file diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000002/final_frame.png b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..956a71ebf2e38710dc8233df784c7a4f9a79c8ce Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/final_frame.png differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000002/first_frame.png b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f3d582204d0434b12ac917a4289ba52c73fecab3 Binary files /dev/null and b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/first_frame.png differ diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000002/ground_truth.mp4 b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b39281f61ad20b35ff80b59a974b4f8adeef49e9 --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd9225502892925eff9223ff4f8eade501bb4fe41ace108296bb0a5f01a37be +size 536809 diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000002/metadata.json b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dfcc6a9106f8afa3e8dd2f5cf671c2cdd4fe3848 --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/metadata.json @@ -0,0 +1,111 @@ +{ + "task_id": "ballcolor_00000002", + "generator": "ballcolor", + "timestamp": "2026-02-26T09:54:25.586595", + "parameters": { + "total_count": 25, + "red_cluster_idx": 0, + "merge_sequence": [ + { + "from": 0, + "to": 1, + "from_color": "red", + "to_color": "navy", + "color_after": "red", + "from_size": 11, + "to_size": 4, + "final_size": 15, 
+ "target_id_letter": "B" + }, + { + "from": 0, + "to": 2, + "from_color": "red", + "to_color": "indigo", + "color_after": "red", + "from_size": 15, + "to_size": 10, + "final_size": 25, + "target_id_letter": "C" + } + ], + "objects": [ + { + "symbol": "cluster", + "cluster_id": 0, + "cluster_id_letter": "A", + "color": "red", + "color_rgb": [ + 255, + 50, + 50 + ], + "initial_size": 11, + "initial_center": [ + 457.43, + 392.49 + ], + "final_size": 25, + "final_center": [ + 542.33, + 803.15 + ], + "is_red": true, + "is_absorbed": false, + "ball_radius": 23 + }, + { + "symbol": "cluster", + "cluster_id": 1, + "cluster_id_letter": "B", + "color": "navy", + "color_rgb": [ + 0, + 0, + 128 + ], + "initial_size": 4, + "initial_center": [ + 256.68, + 140.69 + ], + "final_size": 0, + "final_center": null, + "is_red": false, + "is_absorbed": true, + "ball_radius": 23 + }, + { + "symbol": "cluster", + "cluster_id": 2, + "cluster_id_letter": "C", + "color": "indigo", + "color_rgb": [ + 75, + 0, + 130 + ], + "initial_size": 10, + "initial_center": [ + 542.33, + 803.15 + ], + "final_size": 0, + "final_center": null, + "is_red": false, + "is_absorbed": true, + "ball_radius": 23 + } + ] + }, + "param_hash": "20c1e316f299d8ea", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ballcolor_task/ballcolor_00000002/prompt.txt b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..bdfea73f521aa74e2e185b8aed2c7dfeac8a6104 --- /dev/null +++ b/VBVR-Dataset/ballcolor_task/ballcolor_00000002/prompt.txt @@ -0,0 +1 @@ +In the scene, there are 3 ball clusters: red cluster A has 11 balls, and there are other clusters with different numbers of balls. The global TOTAL label shows the sum 25. Control the red cluster A to absorb other clusters. 
You can only absorb clusters that are smaller than the red cluster. Find the correct sequence to absorb all clusters step by step until all balls become red. \ No newline at end of file diff --git a/VBVR-Dataset/bfs_task/bfs_00000000/final_frame.png b/VBVR-Dataset/bfs_task/bfs_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8fbc49924aec5d6f43939bed4c413637dd5aec86 Binary files /dev/null and b/VBVR-Dataset/bfs_task/bfs_00000000/final_frame.png differ diff --git a/VBVR-Dataset/bfs_task/bfs_00000000/first_frame.png b/VBVR-Dataset/bfs_task/bfs_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e0f0ba5fdb771a258ab1ec319727e65ca9851140 Binary files /dev/null and b/VBVR-Dataset/bfs_task/bfs_00000000/first_frame.png differ diff --git a/VBVR-Dataset/bfs_task/bfs_00000000/ground_truth.mp4 b/VBVR-Dataset/bfs_task/bfs_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a41e63f6950818fa5f45e1ba139aa5a445a4fdd7 --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315dc6360bbb7cc87ae99658d371491e83166d723f0b7790de62ed5d58a79221 +size 151271 diff --git a/VBVR-Dataset/bfs_task/bfs_00000000/metadata.json b/VBVR-Dataset/bfs_task/bfs_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..07235480ca9491376d5c45466a781df407a151b2 --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000000/metadata.json @@ -0,0 +1,175 @@ +{ + "task_id": "bfs_00000000", + "generator": "bfs", + "timestamp": "2026-02-17T07:28:40.639420", + "parameters": { + "nodes": [ + { + "id": 0, + "level": 0, + "center": [ + 512.0, + 252.504625 + ] + }, + { + "id": 1, + "level": 1, + "center": [ + 240.824858, + 325.908625 + ] + }, + { + "id": 2, + "level": 1, + "center": [ + 317.991974, + 325.908625 + ] + }, + { + "id": 3, + "level": 1, + "center": [ + 486.371868, + 
325.908625 + ] + }, + { + "id": 4, + "level": 1, + "center": [ + 659.229314, + 325.908625 + ] + }, + { + "id": 5, + "level": 2, + "center": [ + 225.703373, + 397.934376 + ] + }, + { + "id": 6, + "level": 2, + "center": [ + 304.448656, + 397.934376 + ] + }, + { + "id": 7, + "level": 2, + "center": [ + 512.802813, + 397.934376 + ] + }, + { + "id": 8, + "level": 2, + "center": [ + 812.842729, + 397.934376 + ] + }, + { + "id": 9, + "level": 3, + "center": [ + 470.900439, + 471.778356 + ] + }, + { + "id": 10, + "level": 3, + "center": [ + 844.839057, + 471.778356 + ] + }, + { + "id": 11, + "level": 4, + "center": [ + 496.180949, + 645.793004 + ] + }, + { + "id": 12, + "level": 4, + "center": [ + 630.450454, + 645.793004 + ] + } + ], + "edges": [ + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 0, + 3 + ], + [ + 0, + 4 + ], + [ + 1, + 5 + ], + [ + 2, + 6 + ], + [ + 3, + 7 + ], + [ + 4, + 8 + ], + [ + 5, + 9 + ], + [ + 6, + 10 + ], + [ + 9, + 11 + ], + [ + 10, + 12 + ] + ], + "start_id": 0, + "end_id": 11 + }, + "param_hash": "62082cc642668f25", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/bfs_task/bfs_00000000/prompt.txt b/VBVR-Dataset/bfs_task/bfs_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bb76feb388d7dda4326971634a9ba917b541fba --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a tree structure with nodes connected by edges, a green starting node at the top, a red ending node at the bottom, and a yellow smiley agent positioned at the green starting node. The agent can move along edges, visiting one node per step. Move the yellow smiley agent from the green starting node to the red ending node along the unique tree path, showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/bfs_task/bfs_00000001/final_frame.png b/VBVR-Dataset/bfs_task/bfs_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..51ddede8a62393290b048bd67b9cbe1da0771b34 Binary files /dev/null and b/VBVR-Dataset/bfs_task/bfs_00000001/final_frame.png differ diff --git a/VBVR-Dataset/bfs_task/bfs_00000001/first_frame.png b/VBVR-Dataset/bfs_task/bfs_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c3dafb730ad58372793a1c301105f2288ff5f8ab Binary files /dev/null and b/VBVR-Dataset/bfs_task/bfs_00000001/first_frame.png differ diff --git a/VBVR-Dataset/bfs_task/bfs_00000001/ground_truth.mp4 b/VBVR-Dataset/bfs_task/bfs_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c33c20a7d0db472ca5abb438f55d0ca0b6f677be --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75afb109fd2ce0a1db65136e6830a81b698d4daf7b13bb1dfd894396581ab8d0 +size 270891 diff --git a/VBVR-Dataset/bfs_task/bfs_00000001/metadata.json b/VBVR-Dataset/bfs_task/bfs_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5ca46ef1f0c31260e521170f66de542a825f0133 --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000001/metadata.json @@ -0,0 +1,235 @@ +{ + "task_id": "bfs_00000001", + "generator": "bfs", + "timestamp": "2026-02-17T07:28:41.082297", + "parameters": { + "nodes": [ + { + "id": 0, + "level": 0, + "center": [ + 512.0, + 262.300284 + ] + }, + { + "id": 1, + "level": 1, + "center": [ + 156.492784, + 324.498062 + ] + }, + { + "id": 2, + "level": 1, + "center": [ + 387.473762, + 324.498062 + ] + }, + { + "id": 3, + "level": 1, + "center": [ + 881.155227, + 324.498062 + ] + }, + { + "id": 4, + "level": 2, + "center": [ + 137.451871, + 459.987135 + ] + }, + { + "id": 5, + "level": 2, + "center": [ + 601.138291, + 
459.987135 + ] + }, + { + "id": 6, + "level": 2, + "center": [ + 717.738083, + 459.987135 + ] + }, + { + "id": 7, + "level": 2, + "center": [ + 894.436776, + 459.987135 + ] + }, + { + "id": 8, + "level": 3, + "center": [ + 304.608169, + 514.310098 + ] + }, + { + "id": 9, + "level": 3, + "center": [ + 677.469954, + 514.310098 + ] + }, + { + "id": 10, + "level": 4, + "center": [ + 357.276836, + 580.747082 + ] + }, + { + "id": 11, + "level": 4, + "center": [ + 530.337184, + 580.747082 + ] + }, + { + "id": 12, + "level": 5, + "center": [ + 377.881873, + 682.964054 + ] + }, + { + "id": 13, + "level": 5, + "center": [ + 673.239716, + 682.964054 + ] + }, + { + "id": 14, + "level": 6, + "center": [ + 268.2016, + 856.867676 + ] + }, + { + "id": 15, + "level": 6, + "center": [ + 543.741594, + 856.867676 + ] + }, + { + "id": 16, + "level": 6, + "center": [ + 731.689658, + 856.867676 + ] + }, + { + "id": 17, + "level": 6, + "center": [ + 811.79084, + 856.867676 + ] + } + ], + "edges": [ + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 0, + 3 + ], + [ + 1, + 4 + ], + [ + 1, + 5 + ], + [ + 2, + 6 + ], + [ + 3, + 7 + ], + [ + 4, + 8 + ], + [ + 5, + 9 + ], + [ + 8, + 10 + ], + [ + 9, + 11 + ], + [ + 10, + 12 + ], + [ + 11, + 13 + ], + [ + 12, + 14 + ], + [ + 12, + 15 + ], + [ + 13, + 16 + ], + [ + 13, + 17 + ] + ], + "start_id": 0, + "end_id": 15 + }, + "param_hash": "22c885ca7f0dba2d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/bfs_task/bfs_00000001/prompt.txt b/VBVR-Dataset/bfs_task/bfs_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bb76feb388d7dda4326971634a9ba917b541fba --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a tree structure with nodes connected by edges, a green starting node at the top, a red ending node at the bottom, and a yellow smiley agent 
positioned at the green starting node. The agent can move along edges, visiting one node per step. Move the yellow smiley agent from the green starting node to the red ending node along the unique tree path, showing the complete movement process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/bfs_task/bfs_00000002/final_frame.png b/VBVR-Dataset/bfs_task/bfs_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e57a679f55d87e072c29124ec2f7a7c93025df8f Binary files /dev/null and b/VBVR-Dataset/bfs_task/bfs_00000002/final_frame.png differ diff --git a/VBVR-Dataset/bfs_task/bfs_00000002/first_frame.png b/VBVR-Dataset/bfs_task/bfs_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7f3b18c0b7c6aae3fcbbd35eabcd81edbde2b01e Binary files /dev/null and b/VBVR-Dataset/bfs_task/bfs_00000002/first_frame.png differ diff --git a/VBVR-Dataset/bfs_task/bfs_00000002/ground_truth.mp4 b/VBVR-Dataset/bfs_task/bfs_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..81b9843e239742c940faca744bba170304835147 --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1e23999e89992ac308a45a7bcaa52488fc89461c4aa2d1fa5c380a29d30936 +size 182223 diff --git a/VBVR-Dataset/bfs_task/bfs_00000002/metadata.json b/VBVR-Dataset/bfs_task/bfs_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fdd86235bfccdce3111f313fbbaffc638c82ad48 --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000002/metadata.json @@ -0,0 +1,187 @@ +{ + "task_id": "bfs_00000002", + "generator": "bfs", + "timestamp": "2026-02-17T07:28:41.360617", + "parameters": { + "nodes": [ + { + "id": 0, + "level": 0, + "center": [ + 512.0, + 142.801942 + ] + }, + { + "id": 1, + "level": 1, + "center": [ + 129.686902, + 277.642068 + ] + }, + { + "id": 2, + "level": 1, + 
"center": [ + 202.526678, + 277.642068 + ] + }, + { + "id": 3, + "level": 1, + "center": [ + 323.990349, + 277.642068 + ] + }, + { + "id": 4, + "level": 1, + "center": [ + 483.345585, + 277.642068 + ] + }, + { + "id": 5, + "level": 2, + "center": [ + 104.007221, + 547.09279 + ] + }, + { + "id": 6, + "level": 2, + "center": [ + 346.251194, + 547.09279 + ] + }, + { + "id": 7, + "level": 2, + "center": [ + 429.775629, + 547.09279 + ] + }, + { + "id": 8, + "level": 2, + "center": [ + 611.592383, + 547.09279 + ] + }, + { + "id": 9, + "level": 3, + "center": [ + 221.312601, + 632.869072 + ] + }, + { + "id": 10, + "level": 3, + "center": [ + 615.942006, + 632.869072 + ] + }, + { + "id": 11, + "level": 3, + "center": [ + 894.757687, + 632.869072 + ] + }, + { + "id": 12, + "level": 4, + "center": [ + 131.157114, + 755.936559 + ] + }, + { + "id": 13, + "level": 4, + "center": [ + 496.875311, + 755.936559 + ] + } + ], + "edges": [ + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 0, + 3 + ], + [ + 0, + 4 + ], + [ + 1, + 5 + ], + [ + 2, + 6 + ], + [ + 3, + 7 + ], + [ + 4, + 8 + ], + [ + 5, + 9 + ], + [ + 6, + 10 + ], + [ + 7, + 11 + ], + [ + 9, + 12 + ], + [ + 10, + 13 + ] + ], + "start_id": 0, + "end_id": 13 + }, + "param_hash": "3e9ea9bdca6eecd8", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/bfs_task/bfs_00000002/prompt.txt b/VBVR-Dataset/bfs_task/bfs_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bb76feb388d7dda4326971634a9ba917b541fba --- /dev/null +++ b/VBVR-Dataset/bfs_task/bfs_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a tree structure with nodes connected by edges, a green starting node at the top, a red ending node at the bottom, and a yellow smiley agent positioned at the green starting node. The agent can move along edges, visiting one node per step. 
Move the yellow smiley agent from the green starting node to the red ending node along the unique tree path, showing the complete movement process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000000/final_frame.png b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..673cf4dfea11ad30e2a253d2e7e9ea3e9b5a45bf Binary files /dev/null and b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/final_frame.png differ diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000000/first_frame.png b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6c7e1170bfbb647766dd2cf2daefd1fe87afd4b6 Binary files /dev/null and b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/first_frame.png differ diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000000/ground_truth.mp4 b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..bc84e0114218d8abf583272e5cfd8339b73827f1 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f66cfe31fe5d346c3b52ca0159fad42479bdbe80bcccb79318245d99ae9b03 +size 445500 diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000000/metadata.json b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..2ee48760bb21993182012cfebd82f58b658f10f0 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/metadata.json @@ -0,0 +1,382 @@ +{ + "task_id": "bookshelf_00000000", + "generator": "bookshelf", + "timestamp": "2026-02-17T07:47:11.870318", + "parameters": { + "num_existing": 16, + "num_new": 5, + "objects": [ + { + "symbol": "book", + "type": "existing", + "height": 88.49, + "center": [ + 52.5, + 446.0 
+ ], + "position": 0, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 94.4, + "center": [ + 87.5, + 441.5 + ], + "position": 1, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 103.22, + "center": [ + 122.5, + 435.0 + ], + "position": 2, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 103.4, + "center": [ + 157.5, + 434.5 + ], + "position": 3, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 103.83, + "center": [ + 192.5, + 434.5 + ], + "position": 4, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 104.15, + "center": [ + 227.5, + 434.0 + ], + "position": 5, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 109.85, + "center": [ + 262.5, + 430.0 + ], + "position": 6, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 111.81, + "center": [ + 367.5, + 428.5 + ], + "position": 9, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 135.73, + "center": [ + 472.5, + 410.5 + ], + "position": 12, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 139.5, + "center": [ + 507.5, + 407.5 + ], + "position": 13, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 141.18, + "center": [ + 542.5, + 406.5 + ], + "position": 14, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 142.29, + "center": [ + 612.5, + 405.5 + ], + "position": 16, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + 
"symbol": "book", + "type": "existing", + "height": 145.02, + "center": [ + 647.5, + 403.5 + ], + "position": 17, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 147.83, + "center": [ + 682.5, + 401.5 + ], + "position": 18, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 152.36, + "center": [ + 717.5, + 398.0 + ], + "position": 19, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 154.44, + "center": [ + 752.5, + 396.5 + ], + "position": 20, + "color": [ + 80, + 16, + 111 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 109.85, + "initial_center": [ + 889.5, + 430.0 + ], + "final_center": [ + 297.5, + 430.0 + ], + "insertion_position": 7, + "color": [ + 176, + 103, + 29 + ], + "color_name": "orange", + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 121.18, + "initial_center": [ + 819.5, + 421.5 + ], + "final_center": [ + 332.5, + 421.5 + ], + "insertion_position": 8, + "color": [ + 176, + 103, + 29 + ], + "color_name": "orange", + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 141.18, + "initial_center": [ + 959.5, + 406.5 + ], + "final_center": [ + 402.5, + 406.5 + ], + "insertion_position": 10, + "color": [ + 176, + 103, + 29 + ], + "color_name": "orange", + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 141.18, + "initial_center": [ + 854.5, + 406.5 + ], + "final_center": [ + 437.5, + 406.5 + ], + "insertion_position": 11, + "color": [ + 176, + 103, + 29 + ], + "color_name": "orange", + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 154.44, + "initial_center": [ + 924.5, + 396.5 + ], + "final_center": [ + 577.5, + 396.5 + ], + "insertion_position": 15, + "color": [ + 176, + 103, + 29 + ], + "color_name": "orange", + "width": 29 + } + ] + }, + 
"param_hash": "4edfd3074b252613", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000000/prompt.txt b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..194243422744e75551461004fa36008b572dfb78 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000000/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a bookshelf with a set of books already placed, and a few orange books waiting on the right. There are gaps between the books on the shelf. Place each orange book into a gap where its height is closest to the surrounding books. Show the insertion process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000001/final_frame.png b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4817183b51062601f3481b926b8464388400c5be Binary files /dev/null and b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/final_frame.png differ diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000001/first_frame.png b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9a494150af9bc2120ee66dd5b7c34501605d6ab5 Binary files /dev/null and b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/first_frame.png differ diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000001/ground_truth.mp4 b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2fa245b24daeb7954d0e06158971807fd06f732c --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:c37c4c88a17ff11fbfd4095c4ba7358e6fced1dc3bf2100bd355ad0105e84c41 +size 444833 diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000001/metadata.json b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d0961801f35affae80e5dd87ce7db86afbbdd6a5 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/metadata.json @@ -0,0 +1,382 @@ +{ + "task_id": "bookshelf_00000001", + "generator": "bookshelf", + "timestamp": "2026-02-17T07:47:12.959929", + "parameters": { + "num_existing": 16, + "num_new": 5, + "objects": [ + { + "symbol": "book", + "type": "existing", + "height": 82.56, + "center": [ + 50.0, + 450.5 + ], + "position": 0, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 83.53, + "center": [ + 140.0, + 449.5 + ], + "position": 3, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 85.9, + "center": [ + 170.0, + 448.0 + ], + "position": 4, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 91.18, + "center": [ + 200.0, + 444.0 + ], + "position": 5, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 94.94, + "center": [ + 230.0, + 441.0 + ], + "position": 6, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 101.53, + "center": [ + 260.0, + 436.0 + ], + "position": 7, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 114.58, + "center": [ + 320.0, + 426.5 + ], + "position": 9, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 115.19, + "center": [ + 350.0, + 426.0 + ], + "position": 10, + "color": [ + 46, + 149, + 141 + ], + "width": 
24 + }, + { + "symbol": "book", + "type": "existing", + "height": 117.44, + "center": [ + 440.0, + 424.0 + ], + "position": 13, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 125.03, + "center": [ + 470.0, + 418.5 + ], + "position": 14, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 135.95, + "center": [ + 500.0, + 410.5 + ], + "position": 15, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 153.63, + "center": [ + 530.0, + 397.0 + ], + "position": 16, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 161.0, + "center": [ + 560.0, + 391.5 + ], + "position": 17, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 167.79, + "center": [ + 590.0, + 386.5 + ], + "position": 18, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 168.99, + "center": [ + 620.0, + 385.5 + ], + "position": 19, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "existing", + "height": 174.62, + "center": [ + 650.0, + 381.5 + ], + "position": 20, + "color": [ + 46, + 149, + 141 + ], + "width": 24 + }, + { + "symbol": "book", + "type": "new", + "height": 82.56, + "initial_center": [ + 832.0, + 450.5 + ], + "final_center": [ + 80.0, + 450.5 + ], + "insertion_position": 1, + "color": [ + 186, + 47, + 47 + ], + "color_name": "red", + "width": 24 + }, + { + "symbol": "book", + "type": "new", + "height": 83.53, + "initial_center": [ + 772.0, + 449.5 + ], + "final_center": [ + 110.0, + 449.5 + ], + "insertion_position": 2, + "color": [ + 186, + 47, + 47 + ], + "color_name": "red", + "width": 24 + }, + { + "symbol": "book", + "type": "new", + "height": 115.19, + "initial_center": [ 
+ 802.0, + 426.0 + ], + "final_center": [ + 290.0, + 426.0 + ], + "insertion_position": 8, + "color": [ + 186, + 47, + 47 + ], + "color_name": "red", + "width": 24 + }, + { + "symbol": "book", + "type": "new", + "height": 135.95, + "initial_center": [ + 712.0, + 410.5 + ], + "final_center": [ + 380.0, + 410.5 + ], + "insertion_position": 11, + "color": [ + 186, + 47, + 47 + ], + "color_name": "red", + "width": 24 + }, + { + "symbol": "book", + "type": "new", + "height": 161.0, + "initial_center": [ + 742.0, + 391.5 + ], + "final_center": [ + 410.0, + 391.5 + ], + "insertion_position": 12, + "color": [ + 186, + 47, + 47 + ], + "color_name": "red", + "width": 24 + } + ] + }, + "param_hash": "0a73bccc5d620107", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000001/prompt.txt b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..98f8b52e28c8d904808633f59fc94609c0baae02 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000001/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a bookshelf with a set of books already placed, and a few red books waiting on the right. There are gaps between the books on the shelf. Place each red book into a gap where its height is closest to the surrounding books. Show the insertion process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000002/final_frame.png b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..95da40f9740ce93dc6a128a569130faef21016ca Binary files /dev/null and b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/final_frame.png differ diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000002/first_frame.png b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b7c6e8c894ccc967abc84fedb2374a1151b5c8fb Binary files /dev/null and b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/first_frame.png differ diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000002/ground_truth.mp4 b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4651033b71243478c1b71a7893a8db594dc663d4 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4e783684efb3ae549f4a0f6cdfee319e14ef0097f1dccbe3464339815edbaf7 +size 407772 diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000002/metadata.json b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5ff8700565f6bffd84d9a3bdb94e1eaf60b6852b --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/metadata.json @@ -0,0 +1,319 @@ +{ + "task_id": "bookshelf_00000002", + "generator": "bookshelf", + "timestamp": "2026-02-17T07:47:13.924878", + "parameters": { + "num_existing": 16, + "num_new": 2, + "objects": [ + { + "symbol": "book", + "type": "existing", + "height": 76.21, + "center": [ + 52.5, + 455.0 + ], + "position": 0, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 81.02, + "center": [ + 
87.5, + 451.5 + ], + "position": 1, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 85.41, + "center": [ + 122.5, + 448.0 + ], + "position": 2, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 86.58, + "center": [ + 157.5, + 447.5 + ], + "position": 3, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 105.79, + "center": [ + 192.5, + 433.0 + ], + "position": 4, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 108.06, + "center": [ + 227.5, + 431.0 + ], + "position": 5, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 119.63, + "center": [ + 297.5, + 422.5 + ], + "position": 7, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 124.87, + "center": [ + 332.5, + 418.5 + ], + "position": 8, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 132.75, + "center": [ + 402.5, + 412.5 + ], + "position": 10, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 133.92, + "center": [ + 437.5, + 412.0 + ], + "position": 11, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 134.74, + "center": [ + 472.5, + 411.0 + ], + "position": 12, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 146.29, + "center": [ + 507.5, + 402.5 + ], + "position": 13, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 171.15, + "center": [ + 542.5, + 384.0 + ], + "position": 14, + "color": [ + 123, + 38, + 90 + ], + "width": 
29 + }, + { + "symbol": "book", + "type": "existing", + "height": 172.11, + "center": [ + 577.5, + 383.0 + ], + "position": 15, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 174.84, + "center": [ + 612.5, + 381.0 + ], + "position": 16, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "existing", + "height": 182.45, + "center": [ + 647.5, + 375.5 + ], + "position": 17, + "color": [ + 123, + 38, + 90 + ], + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 108.06, + "initial_center": [ + 714.5, + 431.0 + ], + "final_center": [ + 262.5, + 431.0 + ], + "insertion_position": 6, + "color": [ + 17, + 161, + 17 + ], + "color_name": "green", + "width": 29 + }, + { + "symbol": "book", + "type": "new", + "height": 132.75, + "initial_center": [ + 749.5, + 412.5 + ], + "final_center": [ + 367.5, + 412.5 + ], + "insertion_position": 9, + "color": [ + 17, + 161, + 17 + ], + "color_name": "green", + "width": 29 + } + ] + }, + "param_hash": "7cb939edc57a0d06", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/bookshelf_task/bookshelf_00000002/prompt.txt b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0d2342117b4be8fe296d73123002feba9c9b99c1 --- /dev/null +++ b/VBVR-Dataset/bookshelf_task/bookshelf_00000002/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a bookshelf with a set of books already placed, and a few green books waiting on the right. There are gaps between the books on the shelf. Place each green book into a gap where its height is closest to the surrounding books. Show the insertion process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/final_frame.png b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ee1d7358c447bf215de630179b9dae9a304b107e Binary files /dev/null and b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/final_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/first_frame.png b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8b80ff51161cfe8f4a314ada45ec1817fadd3ec5 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/first_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/ground_truth.mp4 b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f88053ee173709db5a13fcaeeb9a692f60d789e5 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af10c7880abcfacf42870719eaaf817ed1fd1d5e6c59e7fee098d92c14a7906f +size 279272 diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/metadata.json b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..206baba7a20d02d1ed6a5466b4cfdb4da13c3b05 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/metadata.json @@ -0,0 +1,29 @@ +{ + "task_id": "chart_extreme_with_data_00000000", + "generator": "chart_extreme_with_data", + 
"timestamp": "2026-02-17T07:19:51.779443", + "parameters": { + "chart_type": "bar", + "values": [ + 33544.0, + 32685.0, + 17101.0 + ], + "metadata": { + "_type": "ChartMetadata" + }, + "extreme_type": "min", + "target_index": 2, + "target_value": 17101.0 + }, + "param_hash": "bb495fac09292a6a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/prompt.txt b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a0efb64b3c644ad16648c4d7b5f53d1801a51a37 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a bar chart titled 'Monthly Product Sales Statistics 2024' with Month on the x-axis and Sales on the y-axis. Find the month with the lowest sales and draw a red rectangular border around the corresponding bar to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/final_frame.png b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..83672503680de49c1e33be77cb0d9cc7586d931b Binary files /dev/null and b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/final_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/first_frame.png b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..797c87bc5e80e76beebd71c11de089f0efdedac3 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/first_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/ground_truth.mp4 b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5cfcaa349c23aeea9ccfb92e1a8553352a64c690 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5481220f515cfd7ca8822277fc68ec65d18f1890b752128d07a2cc63e3501f4 +size 345079 diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/metadata.json b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..498e4fd4d74078056859d56bdf37eb77b7657210 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/metadata.json @@ -0,0 +1,29 @@ +{ + "task_id": "chart_extreme_with_data_00000001", + "generator": "chart_extreme_with_data", + 
"timestamp": "2026-02-17T07:19:52.220969", + "parameters": { + "chart_type": "pie", + "values": [ + 33.7, + 42.0, + 24.3 + ], + "metadata": { + "_type": "ChartMetadata" + }, + "extreme_type": "max", + "target_index": 1, + "target_value": 42.0 + }, + "param_hash": "da04ce5b6d25d2f5", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/prompt.txt b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..274097235eab92f911af2d971bf022efb8ffad07 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a pie chart titled 'Product Category Sales Share 2024'. Find the category with the largest sales and draw a red rectangular border around the corresponding segment to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/final_frame.png b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..27eb3e50f266abb433693e3007c9873730cf47b7 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/final_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/first_frame.png b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6e878de63a5e527d7e6367224c93c5dc039bc018 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/first_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/ground_truth.mp4 b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a74e32d1ada92682c62095290fff44f7298ed6c9 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c24b34182d85f89a258493a13896867720a135752a8791043efae21c4d6985e +size 266663 diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/metadata.json b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ca462c69aca2a28d3dbae1082a34e3d6b50c3648 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "chart_extreme_with_data_00000002", + "generator": "chart_extreme_with_data", + 
"timestamp": "2026-02-17T07:19:52.726022", + "parameters": { + "chart_type": "scatter", + "values": [ + 67.3, + 72.6, + 79.5, + 86.5, + 84.8 + ], + "x_values": [ + 61.8, + 67.9, + 71.7, + 77.7, + 82.8 + ], + "metadata": { + "_type": "ChartMetadata" + }, + "extreme_type": "min", + "target_index": 0, + "target_value": 67.3 + }, + "param_hash": "45a1a02f1375b69a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/prompt.txt b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d3dda9fba508f3fa842fc8686352c7d999b2dcb --- /dev/null +++ b/VBVR-Dataset/chart_extreme_with_data_task/chart_extreme_with_data_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a scatter chart titled 'Correlation Analysis: Math vs Physics Scores' with Math Score on the x-axis and Physics Score on the y-axis. Find the point with the lowest physics score and draw a red rectangular border around the corresponding point to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/final_frame.png b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d15e97418bd7481d5f9fd5025a4253e6a256593a Binary files /dev/null and b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/final_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/first_frame.png b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f9fc175cc877e54bc5317fe45a09781512d2c683 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/first_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/ground_truth.mp4 b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..9e829f70d9d21ba86d5d4540caa92cd6bc8275da --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e2bc8dea09d563801f727fa16f9c19488a0b3c0ce503bcd1eceb83142713e2 +size 202716 diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/metadata.json b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8e0d7aae1f8f2da9fb2064d01630b7b22ee3ff1c --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/metadata.json @@ -0,0 +1,105 @@ +{ + "task_id": 
"chart_extreme_without_data_00000000", + "generator": "chart_extreme_without_data", + "timestamp": "2026-02-17T07:20:50.004530", + "parameters": { + "chart_type": "bar", + "values": [ + 22, + 19, + 95, + 81, + 92, + 52, + 48, + 66 + ], + "data_points": [ + { + "index": 0, + "value": 22, + "color": [ + 70, + 130, + 180 + ] + }, + { + "index": 1, + "value": 19, + "color": [ + 135, + 206, + 235 + ] + }, + { + "index": 2, + "value": 95, + "color": [ + 255, + 140, + 0 + ] + }, + { + "index": 3, + "value": 81, + "color": [ + 32, + 178, + 170 + ] + }, + { + "index": 4, + "value": 92, + "color": [ + 255, + 20, + 147 + ] + }, + { + "index": 5, + "value": 52, + "color": [ + 50, + 205, + 50 + ] + }, + { + "index": 6, + "value": 48, + "color": [ + 255, + 165, + 0 + ] + }, + { + "index": 7, + "value": 66, + "color": [ + 138, + 43, + 226 + ] + } + ], + "extreme_type": "min", + "target_index": 1, + "target_value": 19 + }, + "param_hash": "fa2084f18d4bc12d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/prompt.txt b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..519f6b5bab08344c0430b4a12b2c9ec7771aef24 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a bar chart. Find the minimum value bar and draw a red rectangular border around the corresponding bar to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/final_frame.png b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..773c2712f71d01062ce95f998dba828b4aa7fd1a Binary files /dev/null and b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/final_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/first_frame.png b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..cd8182ba0ee8ac1b5be91d043ee0abf854e717d6 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/first_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/ground_truth.mp4 b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..dfafc2432ced38e18c64fb91ac66c06652f467ac --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0970fe43759f1da0b36db8089d256cffb4ffed0c9d5bd48ea2fd6f9fc56d31aa +size 216031 diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/metadata.json b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1a9e717546e72b3ab583d73dff1d6f170d17aa1b --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/metadata.json @@ -0,0 +1,95 @@ +{ + "task_id": 
"chart_extreme_without_data_00000001", + "generator": "chart_extreme_without_data", + "timestamp": "2026-02-17T07:20:50.446323", + "parameters": { + "chart_type": "bar", + "values": [ + 24, + 91, + 25, + 89, + 90, + 74, + 88 + ], + "data_points": [ + { + "index": 0, + "value": 24, + "color": [ + 70, + 130, + 180 + ] + }, + { + "index": 1, + "value": 91, + "color": [ + 135, + 206, + 235 + ] + }, + { + "index": 2, + "value": 25, + "color": [ + 255, + 140, + 0 + ] + }, + { + "index": 3, + "value": 89, + "color": [ + 32, + 178, + 170 + ] + }, + { + "index": 4, + "value": 90, + "color": [ + 255, + 20, + 147 + ] + }, + { + "index": 5, + "value": 74, + "color": [ + 50, + 205, + 50 + ] + }, + { + "index": 6, + "value": 88, + "color": [ + 255, + 165, + 0 + ] + } + ], + "extreme_type": "max", + "target_index": 1, + "target_value": 91 + }, + "param_hash": "47edef66033abf15", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/prompt.txt b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..85f572c637bce6de2632592b2d759fab18ac5211 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a bar chart. Find the maximum value bar and draw a red rectangular border around the corresponding bar to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/final_frame.png b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..15e30f0f999b2f8e3cba04bb2690111c707b8058 Binary files /dev/null and b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/final_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/first_frame.png b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4b85e6e0343c37483b680546f1217c5f2de1756c Binary files /dev/null and b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/first_frame.png differ diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/ground_truth.mp4 b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d7d90b67f1bd87bea25c789ecfa2744c6dfd0d92 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcdc191be3fd6072bd39e7b83ffa007d7b98d9a1da416be7e4c417ec9eccd3a +size 172502 diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/metadata.json b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8b557ee9632974c571cb89ad48eb4674f2022989 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": 
"chart_extreme_without_data_00000002", + "generator": "chart_extreme_without_data", + "timestamp": "2026-02-17T07:20:50.875928", + "parameters": { + "chart_type": "line", + "values": [ + 87, + 10, + 26, + 13, + 23, + 64 + ], + "data_points": [ + { + "index": 0, + "value": 87, + "color": [ + 70, + 130, + 180 + ] + }, + { + "index": 1, + "value": 10, + "color": [ + 135, + 206, + 235 + ] + }, + { + "index": 2, + "value": 26, + "color": [ + 255, + 140, + 0 + ] + }, + { + "index": 3, + "value": 13, + "color": [ + 32, + 178, + 170 + ] + }, + { + "index": 4, + "value": 23, + "color": [ + 255, + 20, + 147 + ] + }, + { + "index": 5, + "value": 64, + "color": [ + 50, + 205, + 50 + ] + } + ], + "extreme_type": "max", + "target_index": 0, + "target_value": 87 + }, + "param_hash": "21b5cd46aa8f7afa", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/prompt.txt b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..7a6abf9514ca028a2dcb76e11184740f97fc4c89 --- /dev/null +++ b/VBVR-Dataset/chart_extreme_without_data_task/chart_extreme_without_data_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a line chart. Find the maximum value point and draw a red rectangular border around the corresponding point to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/final_frame.png b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..86b0738acad294656c2da3e12db425ff0fe11c69 Binary files /dev/null and b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/final_frame.png differ diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/first_frame.png b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..756256bd898b7790c567f96e74defdbdf5406c04 Binary files /dev/null and b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/first_frame.png differ diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/ground_truth.mp4 b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2cd6d8040cac7b4e9e7df1307c3c11affc1fd5ec --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1906ea5f90ac88b9aeba29cc88b07a6ed4ab4f317195b21b4f8fbe0ceb7fe80 +size 253974 diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/metadata.json b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..c508f3406c827cf476b90ce9dc608c1e8b6eb5f6 --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "circle_all_squares_from_mixed_shapes_00000000", + "generator": "circle_all_squares_from_mixed_shapes", + "timestamp": "2026-02-17T06:54:30.507124", + "parameters": { + "shapes": [ + { + "type": "rectangle", + "color": [ + 0, + 170, + 0 + ], + "center": [ + 318.0, + 608.0 + ], + "size": [ + 149.0, + 268.0 + ] + }, + { + "type": "square", + "color": [ + 255, + 215, + 0 + ], + "center": [ + 755.0, + 760.0 + ], + "size": [ + 94.0, + 94.0 + ] + }, + { + "type": "square", + "color": [ + 34, + 197, + 94 + ], + "center": [ + 742.0, + 125.0 + ], + "size": [ + 100.0, + 100.0 + ] + } + ], + "square_indices": [ + 1, + 2 + ] + }, + "param_hash": "ccf28c9aaf89f548", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/prompt.txt b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..954b3e81d5a55c198962c152e0e3c32978fcfe4f --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 axis-aligned squares and rectangles. A square has equal width and height, while a rectangle does not. First identify all squares, then draw one red circle around each square. Do not circle any rectangles. Show the complete circling process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/final_frame.png b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5edc08ee1bae77a2cdcbe3a90c68d64c5ad49bd4 Binary files /dev/null and b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/final_frame.png differ diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/first_frame.png b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..138da0c3342b2b92e0acf4f556c5c43e2c040b84 Binary files /dev/null and b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/first_frame.png differ diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/ground_truth.mp4 b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e49d401403766bd7dea00d0369a9863e01b72dbf --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fff68f13c125c9e5522774d7d2ca922ffa7c4183525b4825990d52ade4832f +size 347969 diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/metadata.json b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..0977eac5a834bb9c275c5fff4942dac95017ff4e --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/metadata.json @@ -0,0 +1,72 @@ +{ + "task_id": "circle_all_squares_from_mixed_shapes_00000001", + "generator": "circle_all_squares_from_mixed_shapes", + "timestamp": "2026-02-17T06:54:31.154448", + "parameters": { + "shapes": [ + { + "type": "square", + "color": [ + 99, + 102, + 241 + ], + "center": [ + 683.0, + 797.0 + ], + "size": [ + 127.0, + 127.0 + ] + }, + { + "type": "square", + "color": [ + 255, + 105, + 180 + ], + "center": [ + 618.0, + 356.0 + ], + "size": [ + 150.0, + 150.0 + ] + }, + { + "type": "square", + "color": [ + 0, + 0, + 0 + ], + "center": [ + 382.0, + 806.0 + ], + "size": [ + 83.0, + 83.0 + ] + } + ], + "square_indices": [ + 0, + 1, + 2 + ] + }, + "param_hash": "a3b465204647b12b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/prompt.txt b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..954b3e81d5a55c198962c152e0e3c32978fcfe4f --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 axis-aligned squares and rectangles. A square has equal width and height, while a rectangle does not. First identify all squares, then draw one red circle around each square. Do not circle any rectangles. Show the complete circling process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/final_frame.png b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c80304e60254d46aba3e397c61b8f69078bf8c02 Binary files /dev/null and b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/final_frame.png differ diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/first_frame.png b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f709fc38b13e6426bee55e0d264e2ad9b87a1ee8 Binary files /dev/null and b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/first_frame.png differ diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/ground_truth.mp4 b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..8945550537eab761de458d99851dbba4b4131c26 --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a41d3657e66db03819a063cdb28feb6ebf2b83e1ee77b584b91a34162db2559 +size 222757 diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/metadata.json b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..8580ef188b1974b0ff96a286e555e34f678c96b8 --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/metadata.json @@ -0,0 +1,70 @@ +{ + "task_id": "circle_all_squares_from_mixed_shapes_00000002", + "generator": "circle_all_squares_from_mixed_shapes", + "timestamp": "2026-02-17T06:54:31.763351", + "parameters": { + "shapes": [ + { + "type": "rectangle", + "color": [ + 120, + 120, + 120 + ], + "center": [ + 530.0, + 825.0 + ], + "size": [ + 158.0, + 103.0 + ] + }, + { + "type": "square", + "color": [ + 75, + 0, + 130 + ], + "center": [ + 664.0, + 509.0 + ], + "size": [ + 168.0, + 168.0 + ] + }, + { + "type": "rectangle", + "color": [ + 0, + 170, + 0 + ], + "center": [ + 712.0, + 240.0 + ], + "size": [ + 154.0, + 85.0 + ] + } + ], + "square_indices": [ + 1 + ] + }, + "param_hash": "f5b00ed087a2e051", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/prompt.txt b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..954b3e81d5a55c198962c152e0e3c32978fcfe4f --- /dev/null +++ b/VBVR-Dataset/circle_all_squares_from_mixed_shapes_task/circle_all_squares_from_mixed_shapes_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 axis-aligned squares and rectangles. A square has equal width and height, while a rectangle does not. First identify all squares, then draw one red circle around each square. Do not circle any rectangles. Show the complete circling process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/final_frame.png b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..84f2f601cf2396cd8d842c8a4a5c442ace07d773 Binary files /dev/null and b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/final_frame.png differ diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/first_frame.png b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8f68c76ad74f478416b64ebb60686050cc603a70 Binary files /dev/null and b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/first_frame.png differ diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/ground_truth.mp4 b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2625db31081bebd08783516361faca1c36d3f4df --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200f8a0ae1d2e600127f6dc7c6936fef760dce1671e0f059382ca57a6f661191 +size 246489 diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/metadata.json b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..51a04cd3a0d26b41f1d5166423cce340eb5d9bd0 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/metadata.json @@ -0,0 +1,64 @@ +{ + "task_id": "circle_maximum_value_00000000", + "generator": "circle_maximum_value", + "timestamp": "2026-02-17T07:08:26.417486", + "parameters": { + "numbers": [ + 95, + 
96, + 69, + 13 + ], + "positions": [ + [ + 617, + 333 + ], + [ + 228, + 428 + ], + [ + 729, + 843 + ], + [ + 777, + 522 + ] + ], + "colors": [ + [ + 206, + 236, + 105 + ], + [ + 178, + 36, + 74 + ], + [ + 240, + 135, + 10 + ], + [ + 87, + 181, + 169 + ] + ], + "max_index": 1 + }, + "param_hash": "a644b3858cdc15a8", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/prompt.txt b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c99764b541b1fc7932230197aec716d1ff3f0a6 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000000/prompt.txt @@ -0,0 +1 @@ +There are multiple numbers on the screen, circle the one with the largest value \ No newline at end of file diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/final_frame.png b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..10885cb492fb6db70fce73b502bed3bb55ea7334 Binary files /dev/null and b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/final_frame.png differ diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/first_frame.png b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c12057909d73223187d5e89612a4e96940d23bf4 Binary files /dev/null and b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/first_frame.png differ diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/ground_truth.mp4 b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/ground_truth.mp4 
new file mode 100644 index 0000000000000000000000000000000000000000..51667c6590de5a207d83b55a9a8576da133499a0 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf5409913190d4d651210a4bee9c4e6c79031eb9cbb54359a11e2e60873d9621 +size 248368 diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/metadata.json b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b42f9ad4631e3d7107f171c7d7211752e7274eb1 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/metadata.json @@ -0,0 +1,84 @@ +{ + "task_id": "circle_maximum_value_00000001", + "generator": "circle_maximum_value", + "timestamp": "2026-02-17T07:08:26.903777", + "parameters": { + "numbers": [ + 47, + 92, + 54, + 98, + 48, + 91 + ], + "positions": [ + [ + 358, + 355 + ], + [ + 207, + 731 + ], + [ + 446, + 620 + ], + [ + 275, + 201 + ], + [ + 678, + 683 + ], + [ + 198, + 450 + ] + ], + "colors": [ + [ + 171, + 64, + 231 + ], + [ + 13, + 147, + 108 + ], + [ + 31, + 227, + 213 + ], + [ + 184, + 152, + 129 + ], + [ + 210, + 215, + 191 + ], + [ + 57, + 197, + 217 + ] + ], + "max_index": 3 + }, + "param_hash": "89e149d1e68b19a1", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/prompt.txt b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c99764b541b1fc7932230197aec716d1ff3f0a6 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000001/prompt.txt @@ -0,0 +1 @@ +There are multiple numbers on the screen, circle the one with 
the largest value \ No newline at end of file diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/final_frame.png b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..10706df6e80479e54aae31cd9c450ad9b834fe66 Binary files /dev/null and b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/final_frame.png differ diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/first_frame.png b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d12486360749a10a309ecabe751764c61a07601d Binary files /dev/null and b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/first_frame.png differ diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/ground_truth.mp4 b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f9bfe28f1b3128d790920fdeb945c21201c50d45 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a23d72a485ca17b16d7ff76ea3286de999a620de7ad4e4c68513c66c74c5de2 +size 254542 diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/metadata.json b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8c20b25e848e0c4a56931edc90931a6a4e57d3b9 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "circle_maximum_value_00000002", + "generator": "circle_maximum_value", + "timestamp": "2026-02-17T07:08:27.396670", + "parameters": { + 
"numbers": [ + 91, + 95, + 56, + 99, + 39 + ], + "positions": [ + [ + 424, + 526 + ], + [ + 632, + 308 + ], + [ + 624, + 610 + ], + [ + 236, + 716 + ], + [ + 249, + 468 + ] + ], + "colors": [ + [ + 169, + 41, + 69 + ], + [ + 57, + 68, + 29 + ], + [ + 201, + 58, + 233 + ], + [ + 119, + 210, + 167 + ], + [ + 121, + 131, + 172 + ] + ], + "max_index": 3 + }, + "param_hash": "a1b69133d350f7fa", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/prompt.txt b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4c99764b541b1fc7932230197aec716d1ff3f0a6 --- /dev/null +++ b/VBVR-Dataset/circle_maximum_value_task/circle_maximum_value_00000002/prompt.txt @@ -0,0 +1 @@ +There are multiple numbers on the screen, circle the one with the largest value \ No newline at end of file diff --git a/VBVR-Dataset/clock_task/clock_00000000/final_frame.png b/VBVR-Dataset/clock_task/clock_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..73729d5ff0a3b9444fb87a1941b20488666696e1 Binary files /dev/null and b/VBVR-Dataset/clock_task/clock_00000000/final_frame.png differ diff --git a/VBVR-Dataset/clock_task/clock_00000000/first_frame.png b/VBVR-Dataset/clock_task/clock_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..73729d5ff0a3b9444fb87a1941b20488666696e1 Binary files /dev/null and b/VBVR-Dataset/clock_task/clock_00000000/first_frame.png differ diff --git a/VBVR-Dataset/clock_task/clock_00000000/ground_truth.mp4 b/VBVR-Dataset/clock_task/clock_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..918d2942c1de79bb0d69e631ee2e3576222a29a8 --- /dev/null +++ 
b/VBVR-Dataset/clock_task/clock_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeff3da270e14d7bf53b8f417cc591459483de312e677fbe5d88555fcbe1abc1 +size 1213097 diff --git a/VBVR-Dataset/clock_task/clock_00000000/metadata.json b/VBVR-Dataset/clock_task/clock_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a3792ac097f72d8729b7aa3136b1e858211316c6 --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000000/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "clock_00000000", + "generator": "clock", + "timestamp": "2026-02-17T07:59:13.229114", + "parameters": { + "initial_hour": 3, + "initial_minute": 49, + "final_hour": 3, + "final_minute": 49, + "hours_to_add": 24, + "initial_time": "3:49", + "final_time": "3:49", + "objects": [ + { + "symbol": "clock_face", + "center": [ + 512, + 512 + ], + "radius": 409, + "background_color": "#FFFACD", + "border_color": "black", + "number_style": "none" + }, + { + "symbol": "hour_hand", + "initial_angle": -24.5, + "initial_position": [ + 698.09, + 596.8 + ], + "final_angle": -24.5, + "final_position": [ + 698.09, + 596.8 + ], + "color": "black", + "length": 204.5 + }, + { + "symbol": "minute_hand", + "initial_angle": -204.0, + "initial_position": [ + 250.45, + 395.55 + ], + "final_angle": -204.0, + "final_position": [ + 250.45, + 395.55 + ], + "color": "#9370DB", + "length": 286.3 + }, + { + "symbol": "center", + "position": [ + 512, + 512 + ] + } + ] + }, + "param_hash": "1c17293cb81fcb5b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/clock_task/clock_00000000/prompt.txt b/VBVR-Dataset/clock_task/clock_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5f94caaff20786ec4c8c085904b970625fff6f2 --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000000/prompt.txt @@ -0,0 +1 
@@ +The clock shows 3:49. Show what the clock will look like after 24 hours. \ No newline at end of file diff --git a/VBVR-Dataset/clock_task/clock_00000001/final_frame.png b/VBVR-Dataset/clock_task/clock_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..861725bb26263f9077769c310d76fac95357e560 Binary files /dev/null and b/VBVR-Dataset/clock_task/clock_00000001/final_frame.png differ diff --git a/VBVR-Dataset/clock_task/clock_00000001/first_frame.png b/VBVR-Dataset/clock_task/clock_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..083ce8389cb608e03a9f93faa7cb59e12c5a346d Binary files /dev/null and b/VBVR-Dataset/clock_task/clock_00000001/first_frame.png differ diff --git a/VBVR-Dataset/clock_task/clock_00000001/ground_truth.mp4 b/VBVR-Dataset/clock_task/clock_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..594095d322aa156ea2f177cbdf46312539677e6e --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3c8204b53e35f3a3a54190541ed3460a46b48f79d7be9ee61a2a979889e8dd +size 1215918 diff --git a/VBVR-Dataset/clock_task/clock_00000001/metadata.json b/VBVR-Dataset/clock_task/clock_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b67cc8b0dd2b8cdcd4242588773ab6800bde4b61 --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000001/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "clock_00000001", + "generator": "clock", + "timestamp": "2026-02-17T07:59:14.716832", + "parameters": { + "initial_hour": 5, + "initial_minute": 48, + "final_hour": 3, + "final_minute": 48, + "hours_to_add": 10, + "initial_time": "5:48", + "final_time": "3:48", + "objects": [ + { + "symbol": "clock_face", + "center": [ + 512, + 512 + ], + "radius": 409, + "background_color": "#F0F8FF", + "border_color": "#8B4513", + "number_style": 
"arabic" + }, + { + "symbol": "hour_hand", + "initial_angle": -84.0, + "initial_position": [ + 533.38, + 715.38 + ], + "final_angle": -24.0, + "final_position": [ + 698.82, + 595.18 + ], + "color": "#00008B", + "length": 204.5 + }, + { + "symbol": "minute_hand", + "initial_angle": -198.0, + "initial_position": [ + 239.71, + 423.53 + ], + "final_angle": -198.0, + "final_position": [ + 239.71, + 423.53 + ], + "color": "#DC143C", + "length": 286.3 + }, + { + "symbol": "center", + "position": [ + 512, + 512 + ] + } + ] + }, + "param_hash": "69889b3b0d80d298", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/clock_task/clock_00000001/prompt.txt b/VBVR-Dataset/clock_task/clock_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e9ba129dce1505f7565d5cc94b488816468f7c69 --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000001/prompt.txt @@ -0,0 +1 @@ +The clock shows 5:48. Show what the clock will look like after 10 hours. 
\ No newline at end of file diff --git a/VBVR-Dataset/clock_task/clock_00000002/final_frame.png b/VBVR-Dataset/clock_task/clock_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..55d60299fab7b83a8035110e034dd0dde23645a0 Binary files /dev/null and b/VBVR-Dataset/clock_task/clock_00000002/final_frame.png differ diff --git a/VBVR-Dataset/clock_task/clock_00000002/first_frame.png b/VBVR-Dataset/clock_task/clock_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..870e01d57d1c92b74a163b752071bb448e8f6eca Binary files /dev/null and b/VBVR-Dataset/clock_task/clock_00000002/first_frame.png differ diff --git a/VBVR-Dataset/clock_task/clock_00000002/ground_truth.mp4 b/VBVR-Dataset/clock_task/clock_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..1ebbda017ab248bcc8123e1145e97540dd07ac8b --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a946e213527bc8e6bd86c5a746b5c586bd186889b7afc769ee24f343c0a0e99 +size 1125687 diff --git a/VBVR-Dataset/clock_task/clock_00000002/metadata.json b/VBVR-Dataset/clock_task/clock_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a20567a2c4e8bf32aca2fedc5c1075ea2656d983 --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000002/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "clock_00000002", + "generator": "clock", + "timestamp": "2026-02-17T07:59:16.225076", + "parameters": { + "initial_hour": 10, + "initial_minute": 7, + "final_hour": 6, + "final_minute": 7, + "hours_to_add": 20, + "initial_time": "10:07", + "final_time": "6:07", + "objects": [ + { + "symbol": "clock_face", + "center": [ + 512, + 512 + ], + "radius": 409, + "background_color": "#F5F5DC", + "border_color": "#696969", + "number_style": "roman" + }, + { + "symbol": "hour_hand", + "initial_angle": -213.5, + 
"initial_position": [ + 341.47, + 399.13 + ], + "final_angle": -93.5, + "final_position": [ + 499.52, + 716.12 + ], + "color": "#4B0082", + "length": 204.5 + }, + { + "symbol": "minute_hand", + "initial_angle": 48.0, + "initial_position": [ + 703.57, + 299.24 + ], + "final_angle": 48.0, + "final_position": [ + 703.57, + 299.24 + ], + "color": "#4169E1", + "length": 286.3 + }, + { + "symbol": "center", + "position": [ + 512, + 512 + ] + } + ] + }, + "param_hash": "5b646a61795d3f25", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/clock_task/clock_00000002/prompt.txt b/VBVR-Dataset/clock_task/clock_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..388d160a00fec181d9404c7b7a53091779ac3504 --- /dev/null +++ b/VBVR-Dataset/clock_task/clock_00000002/prompt.txt @@ -0,0 +1 @@ +The clock shows 10:07. Show what the clock will look like after 20 hours. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000000/final_frame.png b/VBVR-Dataset/color_addition_task/color_addition_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c8fa20c7582d928002544e879a4ee31b1b7bcb04 Binary files /dev/null and b/VBVR-Dataset/color_addition_task/color_addition_00000000/final_frame.png differ diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000000/first_frame.png b/VBVR-Dataset/color_addition_task/color_addition_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..df0292fe0d59d1ac266e7fbc547d6c543b76f624 Binary files /dev/null and b/VBVR-Dataset/color_addition_task/color_addition_00000000/first_frame.png differ diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000000/ground_truth.mp4 b/VBVR-Dataset/color_addition_task/color_addition_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..18110d2322b49738276afa26b90571dc90fcc16f --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2924be7ac9b2e6abc289ef255e8b9f89449dff27b8d1b3ef3270876de99f1aef +size 457374 diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000000/metadata.json b/VBVR-Dataset/color_addition_task/color_addition_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..e0487090fe02be1d7a3835c1ef5f309afc47c105 --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000000/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "color_addition_00000000", + "generator": "color_addition", + "timestamp": "2026-02-17T07:39:27.020949", + "parameters": { + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 282, + 737 + ], + "color": [ + 102, + 249, + 238 + ], + "radius": 120 + }, + { + "symbol": "ball", + 
"initial_center": [ + 346, + 292 + ], + "color": [ + 187, + 74, + 68 + ], + "radius": 120 + }, + { + "symbol": "ball", + "final_center": [ + 314.0, + 514.5 + ], + "color": [ + 228, + 255, + 241 + ], + "radius": 120 + } + ] + }, + "param_hash": "15a710dc6033369f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000000/prompt.txt b/VBVR-Dataset/color_addition_task/color_addition_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..244db8e962cc0748d86d6f65fa549436d82dcf20 --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000000/prompt.txt @@ -0,0 +1 @@ +Two circular balls with different colors are positioned at different locations. Animate them moving toward each other at the same speed until they completely merge. When overlapping, the overlapping region displays the additive color mixture of their original colors. Stop when fully merged at the midpoint. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000001/final_frame.png b/VBVR-Dataset/color_addition_task/color_addition_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5b95cc13d5665bb0627204205d82f5f388a32c34 Binary files /dev/null and b/VBVR-Dataset/color_addition_task/color_addition_00000001/final_frame.png differ diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000001/first_frame.png b/VBVR-Dataset/color_addition_task/color_addition_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2b8685b46103898d063746e9f0ab5512bb233b03 Binary files /dev/null and b/VBVR-Dataset/color_addition_task/color_addition_00000001/first_frame.png differ diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000001/ground_truth.mp4 b/VBVR-Dataset/color_addition_task/color_addition_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..dcf41165ea9623d03c941d3ca79ab3e75d0df389 --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed983c2d10bae3cd8519261eb45f344e30fa587c82ff43b4253a0d1e8be09a1 +size 451293 diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000001/metadata.json b/VBVR-Dataset/color_addition_task/color_addition_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..68d9cd119dbaad0f70985aa364d24b5a40d15ac7 --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000001/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "color_addition_00000001", + "generator": "color_addition", + "timestamp": "2026-02-17T07:39:29.001471", + "parameters": { + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 340, + 291 + ], + "color": [ + 159, + 217, + 88 + ], + "radius": 120 + }, + { + "symbol": "ball", + "initial_center": 
[ + 710, + 529 + ], + "color": [ + 62, + 112, + 187 + ], + "radius": 120 + }, + { + "symbol": "ball", + "final_center": [ + 525.0, + 410.0 + ], + "color": [ + 171, + 255, + 213 + ], + "radius": 120 + } + ] + }, + "param_hash": "a1aa547f8a5d147c", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000001/prompt.txt b/VBVR-Dataset/color_addition_task/color_addition_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..52fe616c88d1c0b472986c2b36a82db8dfb91a30 --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000001/prompt.txt @@ -0,0 +1 @@ +Two colored circular balls start at separate positions. They move toward each other at equal speeds until fully overlapping and merging into one. The overlapping region and final merged ball show the additive color mixture of the two original colors. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000002/final_frame.png b/VBVR-Dataset/color_addition_task/color_addition_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b0d5965eece09ed573d692f31d32104261283ed8 Binary files /dev/null and b/VBVR-Dataset/color_addition_task/color_addition_00000002/final_frame.png differ diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000002/first_frame.png b/VBVR-Dataset/color_addition_task/color_addition_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..274451cb4295f74720b2bd5fc4833d8f79567a42 Binary files /dev/null and b/VBVR-Dataset/color_addition_task/color_addition_00000002/first_frame.png differ diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000002/ground_truth.mp4 b/VBVR-Dataset/color_addition_task/color_addition_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..18fb1fb24cb8a5498b197c0fccd74aafdbf8dcde --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083ac170046f49ba6f04e9e0f064ae145daf14f2462c10df6b76101eab0bca00 +size 475183 diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000002/metadata.json b/VBVR-Dataset/color_addition_task/color_addition_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..03e79475b53aa0303425c5602a11bb69201dd79d --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000002/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "color_addition_00000002", + "generator": "color_addition", + "timestamp": "2026-02-17T07:39:30.911159", + "parameters": { + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 289, + 415 + ], + "color": [ + 128, + 230, + 169 + ], + "radius": 120 + }, + { + "symbol": "ball", + 
"initial_center": [ + 731, + 451 + ], + "color": [ + 137, + 105, + 148 + ], + "radius": 120 + }, + { + "symbol": "ball", + "final_center": [ + 510.0, + 433.0 + ], + "color": [ + 201, + 255, + 241 + ], + "radius": 120 + } + ] + }, + "param_hash": "268aec5ed2c63445", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_addition_task/color_addition_00000002/prompt.txt b/VBVR-Dataset/color_addition_task/color_addition_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..52fe616c88d1c0b472986c2b36a82db8dfb91a30 --- /dev/null +++ b/VBVR-Dataset/color_addition_task/color_addition_00000002/prompt.txt @@ -0,0 +1 @@ +Two colored circular balls start at separate positions. They move toward each other at equal speeds until fully overlapping and merging into one. The overlapping region and final merged ball show the additive color mixture of the two original colors. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000000/final_frame.png b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d2b47ef6d6cfb9585409750129175d17e63aa870 Binary files /dev/null and b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/final_frame.png differ diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000000/first_frame.png b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9ce5418a8ab5d5c9ea39ad710aeb7787cb905060 Binary files /dev/null and b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/first_frame.png differ diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000000/ground_truth.mp4 b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..364e2aa6bbf1db5742f6eb573753924d540540e7 --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7026ee8fe5c34a94b02259776abc32a7831b3656e03f566872283ec59a4fbd +size 118072 diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000000/metadata.json b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..26d5bbf209d105c97771ccf1becb2b3f8625df10 --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/metadata.json @@ -0,0 +1,32 @@ +{ + "task_id": "color_mixing_00000000", + "generator": "color_mixing", + "timestamp": "2026-02-17T07:41:48.404084", + "parameters": { + "color1": [ + 52, + 24, + 18 + ], + "color2": [ + 84, + 77, + 113 + ], + "result": [ + 136, + 101, + 131 + ] + }, + "param_hash": "c05c98d65f55b077", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": 
"", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000000/prompt.txt b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..22126e0a392dd07d4de76ed037415201454af045 --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000000/prompt.txt @@ -0,0 +1 @@ +The scene has two colored light sources positioned on the left and right sides, and a mixing zone marked by a white rectangular border in the center. In additive color mixing (light mixing), when two lights overlap, their RGB components add together: result_R = min(color1_R + color2_R, 255), same for G and B, with each channel clamped to 255 maximum. First identify the RGB values of the left light (an RGB(52, 24, 18) colored light) and the right light (an RGB(84, 77, 113) colored light), then calculate the mixed color by adding their RGB components channel by channel. Fill the white-bordered mixing zone in the center with the resulting mixed color and show the full calculation process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000001/final_frame.png b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..df764d8ffd7115f80692b7aff96a9c17b9058811 Binary files /dev/null and b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/final_frame.png differ diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000001/first_frame.png b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4066d5b24cbfc6eed281b41d1a606a2f3083183c Binary files /dev/null and b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/first_frame.png differ diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000001/ground_truth.mp4 b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..370317ff06d89b089f9ab6f62c00c56afb35b3cb --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac21dfa1b3adc298af897d124096a31758d05a6f83e79641eeebd4567f8df1e +size 120169 diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000001/metadata.json b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4da059cf315d5310e8cd7b86a53552b9dfc45dc0 --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/metadata.json @@ -0,0 +1,32 @@ +{ + "task_id": "color_mixing_00000001", + "generator": "color_mixing", + "timestamp": "2026-02-17T07:41:49.251579", + "parameters": { + "color1": [ + 90, + 43, + 100 + ], + "color2": [ + 28, + 29, + 128 + ], + "result": [ + 118, + 72, + 228 + ] + }, + "param_hash": "b67c5ef80459b98a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": 
"", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000001/prompt.txt b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..eb5183325deeeda468bc1a9e50a1e5d518fc2ef0 --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000001/prompt.txt @@ -0,0 +1 @@ +The scene has two colored light sources positioned on the left and right sides, and a mixing zone marked by a white rectangular border in the center. In additive color mixing (light mixing), when two lights overlap, their RGB components add together: result_R = min(color1_R + color2_R, 255), same for G and B, with each channel clamped to 255 maximum. First identify the RGB values of the left light (an RGB(90, 43, 100) colored light) and the right light (an RGB(28, 29, 128) colored light), then calculate the mixed color by adding their RGB components channel by channel. Fill the white-bordered mixing zone in the center with the resulting mixed color and show the full calculation process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000002/final_frame.png b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..973fe9506d044e4f5da51d8598ac50d953baa2ee Binary files /dev/null and b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/final_frame.png differ diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000002/first_frame.png b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3e9fbc8ae9cbe62de128a4b5bd8be3ff5eaeb93f Binary files /dev/null and b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/first_frame.png differ diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000002/ground_truth.mp4 b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..05c5fc8b8f0d2b7881f212a518d2145ca00ef234 --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b716e418fa968f968d8faefb9d36eb2eff1291ad3ff6e067620ac6069e812c2 +size 114531 diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000002/metadata.json b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d36499b1022d8194c0a897e38be387aa907a625a --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/metadata.json @@ -0,0 +1,32 @@ +{ + "task_id": "color_mixing_00000002", + "generator": "color_mixing", + "timestamp": "2026-02-17T07:41:50.069242", + "parameters": { + "color1": [ + 35, + 80, + 69 + ], + "color2": [ + 1, + 33, + 6 + ], + "result": [ + 36, + 113, + 75 + ] + }, + "param_hash": "e6f7c353080ae922", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + 
"repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_mixing_task/color_mixing_00000002/prompt.txt b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e2b2ebbfc93a96d7fa057455ca4b024837d596b --- /dev/null +++ b/VBVR-Dataset/color_mixing_task/color_mixing_00000002/prompt.txt @@ -0,0 +1 @@ +The scene has two colored light sources positioned on the left and right sides, and a mixing zone marked by a white rectangular border in the center. In additive color mixing (light mixing), when two lights overlap, their RGB components add together: result_R = min(color1_R + color2_R, 255), same for G and B, with each channel clamped to 255 maximum. First identify the RGB values of the left light (an RGB(35, 80, 69) colored light) and the right light (a black/dark light), then calculate the mixed color by adding their RGB components channel by channel. Fill the white-bordered mixing zone in the center with the resulting mixed color and show the full calculation process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/final_frame.png b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6595d038b28c2bad0ade1d851f45177ea689617f Binary files /dev/null and b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/final_frame.png differ diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/first_frame.png b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d3d97a54bdabc35240402aa89331631c01c09f6f Binary files /dev/null and b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/first_frame.png differ diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/ground_truth.mp4 b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e98942f6fb0cc7867fcbe8233fd4de2757274f45 --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3949cf3ce90054cf0fdc768fb2fcfb942b294ab2834762281697206eda3e33b5 +size 431319 diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/metadata.json b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8736af85e5dfbd25e82aa359bc6588383aee9f8f --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "color_subtraction_00000000", + "generator": "color_subtraction", + "timestamp": "2026-02-17T07:40:38.919684", + "parameters": { + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 292, + 470 + ], + "color": [ + 102, + 
249, + 238 + ], + "radius": 120 + }, + { + "symbol": "ball", + "initial_center": [ + 428, + 771 + ], + "color": [ + 187, + 74, + 68 + ], + "radius": 120 + }, + { + "symbol": "ball", + "final_center": [ + 360.0, + 620.5 + ], + "color": [ + 27, + 0, + 14 + ], + "radius": 120 + } + ] + }, + "param_hash": "88ee229d4ffa214a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/prompt.txt b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3b4609ad2b76e20d8c4838c4781b21c401c46007 --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000000/prompt.txt @@ -0,0 +1 @@ +Two colored balls start at different positions. Animate them moving toward each other at equal speeds until they merge. When overlapping, show subtractive color mixing in the overlap region. Stop when fully merged at the midpoint. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/final_frame.png b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e5317ba1b4216e111092ebf9cd80973fb2bab1fa Binary files /dev/null and b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/final_frame.png differ diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/first_frame.png b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..237a806ef73693b1c13f840be19c7f67ad1bdc43 Binary files /dev/null and b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/first_frame.png differ diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/ground_truth.mp4 b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..459914cf6e49f2acd4543fdf8feb2e9772fa6fc2 --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50f45364e28fdd74b08e1bec33dacf8d526b2fdbecf1b6fd1d97e31ffd38fec +size 417251 diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/metadata.json b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d571f06f92fb0b08de69d61a5f3a1c96e3ddec57 --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "color_subtraction_00000001", + "generator": "color_subtraction", + "timestamp": "2026-02-17T07:40:40.524517", + "parameters": { + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 198, + 398 + ], + "color": [ + 83, + 
56, + 76 + ], + "radius": 120 + }, + { + "symbol": "ball", + "initial_center": [ + 699, + 813 + ], + "color": [ + 159, + 217, + 88 + ], + "radius": 120 + }, + { + "symbol": "ball", + "final_center": [ + 448.5, + 605.5 + ], + "color": [ + 29, + 0, + 102 + ], + "radius": 120 + } + ] + }, + "param_hash": "655f641ad124f752", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/prompt.txt b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d35b48c9858dd5f0cf302c744d29202a8c4ee1ab --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000001/prompt.txt @@ -0,0 +1 @@ +Animate two colored balls moving toward each other at identical speeds. Use subtractive color mixing in overlapping regions. Stop the animation when both balls fully merge at the midpoint. 
\ No newline at end of file diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/final_frame.png b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..69c147af8725417e4d7568755494e79099f1988d Binary files /dev/null and b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/final_frame.png differ diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/first_frame.png b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b34f3da6230b2721325415c9bd82437899d268cc Binary files /dev/null and b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/first_frame.png differ diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/ground_truth.mp4 b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..825557e6c8a0bc8af58acdf3acfe49d844b26e1b --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4919ad938557b762bfd96102e9a743a88440e10294c4dd22d390957084ccf2f +size 432292 diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/metadata.json b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..20585521a2d2628fa2869922066c9144aadee5ac --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "color_subtraction_00000002", + "generator": "color_subtraction", + "timestamp": "2026-02-17T07:40:42.543924", + "parameters": { + "objects": [ + { + "symbol": "ball", + "initial_center": [ + 270, + 173 + ], + "color": [ + 153, + 
198, + 168 + ], + "radius": 120 + }, + { + "symbol": "ball", + "initial_center": [ + 648, + 371 + ], + "color": [ + 102, + 238, + 139 + ], + "radius": 120 + }, + { + "symbol": "ball", + "final_center": [ + 459.0, + 272.0 + ], + "color": [ + 106, + 0, + 76 + ], + "radius": 120 + } + ] + }, + "param_hash": "8bc2d65b485f5027", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/prompt.txt b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d35b48c9858dd5f0cf302c744d29202a8c4ee1ab --- /dev/null +++ b/VBVR-Dataset/color_subtraction_task/color_subtraction_00000002/prompt.txt @@ -0,0 +1 @@ +Animate two colored balls moving toward each other at identical speeds. Use subtractive color mixing in overlapping regions. Stop the animation when both balls fully merge at the midpoint. 
\ No newline at end of file diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/final_frame.png b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..133265592602872837b3c5a8d688ead0deb82450 Binary files /dev/null and b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/final_frame.png differ diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/first_frame.png b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bcad716e3e0d10660da8f92b344b013cbb0ba21c Binary files /dev/null and b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/first_frame.png differ diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/ground_truth.mp4 b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3956d0ddfe3e264a930ecfd2e52042bcb7fc5bb3 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0967055e3774e02ac77b2552cc3f874c37ab5b4892208c49dc966a56dec04721 +size 187865 diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/metadata.json b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a3961b13870f40e077434caf0553782492a76fec --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/metadata.json @@ -0,0 +1,57 @@ +{ + "task_id": "combined_objects_spinning_00000000", + 
"generator": "combined_objects_spinning", + "timestamp": "2026-02-17T07:26:32.915385", + "parameters": { + "objects": [ + { + "shape": "circle", + "color": [ + 180, + 180, + 180 + ], + "size": 88, + "start_angle": -36, + "target_angle": 63, + "start_center": [ + 343.327676, + 512.0 + ], + "target_center": [ + 678.903512, + 512.0 + ] + }, + { + "shape": "triangle", + "color": [ + 120, + 175, + 235 + ], + "size": 93, + "start_angle": 82, + "target_angle": -11, + "start_center": [ + 163.232746, + 512.0 + ], + "target_center": [ + 878.243351, + 512.0 + ] + } + ] + }, + "param_hash": "051f3c9b13cc0eb1", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/prompt.txt b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e0d465562c14b50965c539bc0e3ebdfe0c094b6 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 2 objects on the left side and dashed target outlines on the right side. The dashed target outlines remain completely stationary. For each object, first rotate it in place to match the orientation of its corresponding dashed target outline, then move it horizontally to the right so that it aligns exactly with and fits within its corresponding dashed target outline. 
\ No newline at end of file diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/final_frame.png b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f2b858e906f1379102bb00c923b23e9c76637900 Binary files /dev/null and b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/final_frame.png differ diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/first_frame.png b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..cf59f8a88b694ad7f5e33dfb53a386afbad2fcc3 Binary files /dev/null and b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/first_frame.png differ diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/ground_truth.mp4 b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..9ac4279a25bd8bbefb899ec709ea78e239f98215 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd32f3b4e03b3adc35fa95372cfe92d20ff078572514ed4c261249ea66f3e14 +size 223953 diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/metadata.json b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a09c18bf42be7d5c4041a278caf65c33ad30c2fb --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/metadata.json @@ -0,0 +1,57 @@ +{ + "task_id": "combined_objects_spinning_00000001", + 
"generator": "combined_objects_spinning", + "timestamp": "2026-02-17T07:26:37.297630", + "parameters": { + "objects": [ + { + "shape": "pentagon", + "color": [ + 120, + 200, + 160 + ], + "size": 81, + "start_angle": 50, + "target_angle": -41, + "start_center": [ + 360.692139, + 512.0 + ], + "target_center": [ + 673.378179, + 512.0 + ] + }, + { + "shape": "circle", + "color": [ + 120, + 175, + 235 + ], + "size": 91, + "start_angle": -64, + "target_angle": 5, + "start_center": [ + 188.889451, + 512.0 + ], + "target_center": [ + 874.332243, + 512.0 + ] + } + ] + }, + "param_hash": "c70187a63e00e6e0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/prompt.txt b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e0d465562c14b50965c539bc0e3ebdfe0c094b6 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 2 objects on the left side and dashed target outlines on the right side. The dashed target outlines remain completely stationary. For each object, first rotate it in place to match the orientation of its corresponding dashed target outline, then move it horizontally to the right so that it aligns exactly with and fits within its corresponding dashed target outline. 
\ No newline at end of file diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/final_frame.png b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6f7398511d91c91dae7b5522b26a77968b414448 Binary files /dev/null and b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/final_frame.png differ diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/first_frame.png b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..52ed59642b4bda9388c14bfd9a05d2bee1d1be70 Binary files /dev/null and b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/first_frame.png differ diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/ground_truth.mp4 b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6724271dc65dfcdba16ef02657bfc35435275102 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310b450e71912d77eb08dfbbcbd21a47d59f41d6fd75a99f258bf069b94dfde6 +size 189094 diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/metadata.json b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..99d2a8d4a5346a792c278e64ca89cf308dc02324 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/metadata.json @@ -0,0 +1,57 @@ +{ + "task_id": "combined_objects_spinning_00000002", + 
"generator": "combined_objects_spinning", + "timestamp": "2026-02-17T07:26:37.756528", + "parameters": { + "objects": [ + { + "shape": "circle", + "color": [ + 230, + 170, + 95 + ], + "size": 91, + "start_angle": 59, + "target_angle": -69, + "start_center": [ + 348.377127, + 422.382494 + ], + "target_center": [ + 867.959183, + 422.382494 + ] + }, + { + "shape": "pentagon", + "color": [ + 200, + 140, + 220 + ], + "size": 91, + "start_angle": -10, + "target_angle": 12, + "start_center": [ + 348.377127, + 603.0 + ], + "target_center": [ + 658.592259, + 603.0 + ] + } + ] + }, + "param_hash": "2456315481677593", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/prompt.txt b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e0d465562c14b50965c539bc0e3ebdfe0c094b6 --- /dev/null +++ b/VBVR-Dataset/combined_objects_spinning_task/combined_objects_spinning_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 2 objects on the left side and dashed target outlines on the right side. The dashed target outlines remain completely stationary. For each object, first rotate it in place to match the orientation of its corresponding dashed target outline, then move it horizontally to the right so that it aligns exactly with and fits within its corresponding dashed target outline. 
\ No newline at end of file diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/final_frame.png b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..be37eeef9e97ac64b2ad5779d00bc591caf4227d Binary files /dev/null and b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/final_frame.png differ diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/first_frame.png b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e91be2cfbe1dbbd097ddb8cf787b259cd7e5dfe5 Binary files /dev/null and b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/first_frame.png differ diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/ground_truth.mp4 b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a4446dc99695b13f660d718b131754efd61ce52d --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe0b27299a65bee6cb7ad37b9c9138162a80547d9b2f8016b4dabd523202d648 +size 395684 diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/metadata.json b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..56e43ceae7e9668066398894da57f596d9a78e12 --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/metadata.json @@ -0,0 +1,53 @@ +{ + "task_id": "communicating_vessels_00000000", + "generator": "communicating_vessels", + "timestamp": "2026-02-17T08:06:53.208239", + "parameters": 
{ + "num_tubes": 3, + "liquid_type": "water", + "liquid_color": "blue", + "viscosity_description": "water-like (low viscosity)", + "decay_constant": 3.57, + "gravity": 9.8, + "gravity_body": "Earth", + "total_time": 1.215537, + "equilibrium_level": 521.666667, + "equilibrium_level_cm": 52, + "tubes": [ + { + "symbol": "tube_0", + "index": 0, + "initial_level": 515.0, + "initial_level_cm": 51, + "final_level": 521.57971, + "final_level_cm": 52 + }, + { + "symbol": "tube_1", + "index": 1, + "initial_level": 490.0, + "initial_level_cm": 49, + "final_level": 521.253623, + "final_level_cm": 52 + }, + { + "symbol": "tube_2", + "index": 2, + "initial_level": 560.0, + "initial_level_cm": 56, + "final_level": 522.166667, + "final_level_cm": 52 + } + ] + }, + "param_hash": "32c19e2af84faf3a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/prompt.txt b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c83fdafda6f0e64f32759d74026b07d61d88aa68 --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000000/prompt.txt @@ -0,0 +1 @@ +A system of 3 communicating vessels with equal-diameter vertical tubes is filled with water (water-like (low viscosity)), which appears blue in color. As shown in the initial frame, the liquid levels in the tubes are [51, 49, 56] cm respectively. Due to pressure differences between the tubes, the liquid begins to flow through the connecting channels at the bottom. The flow is governed by hydrostatic pressure equalization and damped by viscous resistance with coefficient k=3.57. As the liquid redistributes, the height differences gradually decrease, and the system evolves toward equilibrium. 
Eventually, through conservation of volume, all tubes reach the same final liquid level, which equals the average of the initial heights. Simulate this settling process from the initial unbalanced state to the final stable equilibrium. \ No newline at end of file diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/final_frame.png b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a26090989e3b29297556cde0ef0f17194ecb908b Binary files /dev/null and b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/final_frame.png differ diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/first_frame.png b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0016d3239b0aab4f70cc7078f3b3d6887a6f9511 Binary files /dev/null and b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/first_frame.png differ diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/ground_truth.mp4 b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..1dbc14e940a7210e9abc17aa3dece37386861d24 --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6c5fb2b34ca7f64d11ced58ce2477778488dbfd038893c417b3a6dd6507e2c +size 459453 diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/metadata.json b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6890f72f8f743c15277b2d1eb5fe1d6770e1d18b --- /dev/null +++ 
b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "communicating_vessels_00000001", + "generator": "communicating_vessels", + "timestamp": "2026-02-17T08:06:53.937505", + "parameters": { + "num_tubes": 4, + "liquid_type": "oil", + "liquid_color": "yellow", + "viscosity_description": "oil-like (medium viscosity)", + "decay_constant": 2.39, + "gravity": 9.8, + "gravity_body": "Earth", + "total_time": 2.477087, + "equilibrium_level": 313.75, + "equilibrium_level_cm": 31, + "tubes": [ + { + "symbol": "tube_0", + "index": 0, + "initial_level": 500.0, + "initial_level_cm": 50, + "final_level": 314.25, + "final_level_cm": 31 + }, + { + "symbol": "tube_1", + "index": 1, + "initial_level": 210.0, + "initial_level_cm": 21, + "final_level": 313.471477, + "final_level_cm": 31 + }, + { + "symbol": "tube_2", + "index": 2, + "initial_level": 300.0, + "initial_level_cm": 30, + "final_level": 313.713087, + "final_level_cm": 31 + }, + { + "symbol": "tube_3", + "index": 3, + "initial_level": 245.0, + "initial_level_cm": 24, + "final_level": 313.565436, + "final_level_cm": 31 + } + ] + }, + "param_hash": "bbd0b39c24f46b97", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/prompt.txt b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9e3cbd43c03dd7d5b6f65d84f4ae6f5ff30cc81b --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000001/prompt.txt @@ -0,0 +1 @@ +A system of 4 communicating vessels with equal-diameter vertical tubes is filled with oil (oil-like (medium viscosity)), which appears yellow in color. 
As shown in the initial frame, the liquid levels in the tubes are [50, 21, 30, 24] cm respectively. Due to pressure differences between the tubes, the liquid begins to flow through the connecting channels at the bottom. The flow is governed by hydrostatic pressure equalization and damped by viscous resistance with coefficient k=2.39. As the liquid redistributes, the height differences gradually decrease, and the system evolves toward equilibrium. Eventually, through conservation of volume, all tubes reach the same final liquid level, which equals the average of the initial heights. Simulate this settling process from the initial unbalanced state to the final stable equilibrium. \ No newline at end of file diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/final_frame.png b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a1b84c5870561626adf357a29a4658cc05cd98e7 Binary files /dev/null and b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/final_frame.png differ diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/first_frame.png b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c49148c065068f92e4151e2846847feff16c78a3 Binary files /dev/null and b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/first_frame.png differ diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/ground_truth.mp4 b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..844ee727bf8847360357a6f11fa7c27b95f1429f --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:51aa1a744a7050c6667b1c5e1ba7de0372fa9cc7d2066ac5ba484b90ed6f4678 +size 316785 diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/metadata.json b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b6595f740e64bd764fe051d831c5942df9866173 --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/metadata.json @@ -0,0 +1,45 @@ +{ + "task_id": "communicating_vessels_00000002", + "generator": "communicating_vessels", + "timestamp": "2026-02-17T08:06:54.613197", + "parameters": { + "num_tubes": 2, + "liquid_type": "oil", + "liquid_color": "yellow", + "viscosity_description": "oil-like (medium viscosity)", + "decay_constant": 2.31, + "gravity": 9.8, + "gravity_body": "Earth", + "total_time": 2.123496, + "equilibrium_level": 482.5, + "equilibrium_level_cm": 48, + "tubes": [ + { + "symbol": "tube_0", + "index": 0, + "initial_level": 415.0, + "initial_level_cm": 41, + "final_level": 482.0, + "final_level_cm": 48 + }, + { + "symbol": "tube_1", + "index": 1, + "initial_level": 550.0, + "initial_level_cm": 55, + "final_level": 483.0, + "final_level_cm": 48 + } + ] + }, + "param_hash": "899872cc65951950", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/prompt.txt b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..91c5c3555d236c616fb6eea5a137a3b487abfe35 --- /dev/null +++ b/VBVR-Dataset/communicating_vessels_task/communicating_vessels_00000002/prompt.txt @@ -0,0 +1 @@ +A system of 2 communicating vessels with equal-diameter vertical tubes is filled with oil (oil-like (medium 
viscosity)), which appears yellow in color. As shown in the initial frame, the liquid levels in the tubes are [41, 55] cm respectively. Due to pressure differences between the tubes, the liquid begins to flow through the connecting channels at the bottom. The flow is governed by hydrostatic pressure equalization and damped by viscous resistance with coefficient k=2.31. As the liquid redistributes, the height differences gradually decrease, and the system evolves toward equilibrium. Eventually, through conservation of volume, all tubes reach the same final liquid level, which equals the average of the initial heights. Simulate this settling process from the initial unbalanced state to the final stable equilibrium. \ No newline at end of file diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/final_frame.png b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..63f2c2096a36bb51285dce4252ad60ab35f8dabe Binary files /dev/null and b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/final_frame.png differ diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/first_frame.png b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3eb09e24f8fdeb33e4992821361200fa11e88bec Binary files /dev/null and b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/first_frame.png differ diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/ground_truth.mp4 b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/ground_truth.mp4 new file mode 100644 
index 0000000000000000000000000000000000000000..bc5a55b044ef71acbc952ec1f7273d1237ffcdc6 --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:831feeb0542a3cae5ff7680614e681aeebc0aceea781be49d7da37635f0d3f8f +size 136459 diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/metadata.json b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a27391fb6d5cf03f266c5b529f93180eda247f8e --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/metadata.json @@ -0,0 +1,42 @@ +{ + "task_id": "complete_missing_contour_segments_00000000", + "generator": "complete_missing_contour_segments", + "timestamp": "2026-02-17T07:31:31.096809", + "parameters": { + "shapes": [ + { + "type": "triangle", + "vertices": [ + [ + 647, + 189 + ], + [ + 938, + 700 + ], + [ + 350, + 695 + ] + ], + "missing_edge_idx": 1, + "color": [ + 50, + 50, + 50 + ] + } + ] + }, + "param_hash": "479d968f498da9e4", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/prompt.txt b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2fde686dc884c0d9e040308cd1d282d34c130b8 --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 1 geometric shape. 
It has exactly one missing edge (a gap between two visible endpoints where an edge is not drawn). First locate the two endpoints of the missing edge, then draw a single straight line segment connecting them to complete the shape. Do not redraw existing edges or add any extra lines. Show the drawing process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/final_frame.png b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ae94bc53d01c604bb7c1832307420935cc8bf10e Binary files /dev/null and b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/final_frame.png differ diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/first_frame.png b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a2845224b3fcf602a62c3869f11a602ec3f8335b Binary files /dev/null and b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/first_frame.png differ diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/ground_truth.mp4 b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a1b2c6dc71116e93a671d30650627344e2892874 --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4555717d47e2f6f878780fba606dfdd68e1e19f9c250a9cf552d2738f3394d59 +size 158321 diff --git 
a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/metadata.json b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..afa8fb8d6b7350eb0f3d144156654161af6af67f --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/metadata.json @@ -0,0 +1,77 @@ +{ + "task_id": "complete_missing_contour_segments_00000001", + "generator": "complete_missing_contour_segments", + "timestamp": "2026-02-17T07:31:31.594251", + "parameters": { + "shapes": [ + { + "type": "quadrilateral", + "vertices": [ + [ + 188, + 601 + ], + [ + 466, + 581 + ], + [ + 486, + 859 + ], + [ + 208, + 879 + ] + ], + "missing_edge_idx": 2, + "color": [ + 0, + 128, + 128 + ] + }, + { + "type": "pentagon", + "vertices": [ + [ + 459, + 320 + ], + [ + 267, + 376 + ], + [ + 154, + 211 + ], + [ + 277, + 52 + ], + [ + 465, + 120 + ] + ], + "missing_edge_idx": 1, + "color": [ + 128, + 0, + 128 + ] + } + ] + }, + "param_hash": "8f494bbf35fb78ee", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/prompt.txt b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..dbfcd90f9ad24e842bcdd468abf505db0d9e41d3 --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 2 geometric shapes. Each shape has exactly one missing edge (a gap between two visible endpoints where an edge is not drawn). 
First locate the two endpoints of each missing edge, then draw a single straight line segment connecting them to complete the shape. Do not redraw existing edges or add any extra lines. Show the drawing process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/final_frame.png b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..645b10f06dd61362a9e590f8f2568dfb9aaa7ed9 Binary files /dev/null and b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/final_frame.png differ diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/first_frame.png b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3b8253484940a4f4954e6c1b18dbee61072f11de Binary files /dev/null and b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/first_frame.png differ diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/ground_truth.mp4 b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7136bd92e6b7405032af7569fda8b2005dc5118d --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c913e5cfbd889dbec2891eadf3709f2b9c6c0edbadb01f50748f421126acfbf3 +size 164550 diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/metadata.json 
b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..110eb091772185597fa875a1e2c327b7a001cbe1 --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/metadata.json @@ -0,0 +1,46 @@ +{ + "task_id": "complete_missing_contour_segments_00000002", + "generator": "complete_missing_contour_segments", + "timestamp": "2026-02-17T07:31:32.096891", + "parameters": { + "shapes": [ + { + "type": "quadrilateral", + "vertices": [ + [ + 379, + 717 + ], + [ + 462, + 252 + ], + [ + 927, + 335 + ], + [ + 844, + 800 + ] + ], + "missing_edge_idx": 3, + "color": [ + 128, + 0, + 128 + ] + } + ] + }, + "param_hash": "72a1af4b57ff8e86", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/prompt.txt b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c2fde686dc884c0d9e040308cd1d282d34c130b8 --- /dev/null +++ b/VBVR-Dataset/complete_missing_contour_segments_task/complete_missing_contour_segments_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 1 geometric shape. It has exactly one missing edge (a gap between two visible endpoints where an edge is not drawn). First locate the two endpoints of the missing edge, then draw a single straight line segment connecting them to complete the shape. Do not redraw existing edges or add any extra lines. Show the drawing process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/final_frame.png b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c02ee77dfbe33b71e47579c725680acf8018edbf Binary files /dev/null and b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/final_frame.png differ diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/first_frame.png b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..10cba3a83f7c54a247ee452796fb9e0bcadfed73 Binary files /dev/null and b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/first_frame.png differ diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/ground_truth.mp4 b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..97131205290d2601b25328cab588f26408157fc4 --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db25ff8153ebb71b8789ea293599269aa939da327888b92d1db2ad8c267b143 +size 394785 diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/metadata.json b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..13eeab5729bfb0d9ed107835d3a2d7564faabdee --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/metadata.json @@ -0,0 +1,37 @@ +{ + "task_id": "construct_concentric_ring_00000000", + 
"generator": "construct_concentric_ring", + "timestamp": "2026-02-17T07:05:03.507905", + "parameters": { + "outer_radius": 352, + "inner_radius": 237, + "outer_color": [ + 255, + 225, + 25 + ], + "inner_color": [ + 255, + 215, + 180 + ], + "outer_start_position": [ + 366, + 307 + ], + "inner_start_position": [ + 773, + 716 + ] + }, + "param_hash": "03707c50a52f77d9", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/prompt.txt b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d7d4427fc2aa39229850395c78d03e0b46147ea --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000000/prompt.txt @@ -0,0 +1,3 @@ +The scene shows two circles of the same color but different sizes at different positions. +Keep both circles unchanged in size and color. Only move their positions. +Move both circles until they share the same center point (concentric circles) exactly at the center of the image. 
\ No newline at end of file diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/final_frame.png b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..513a0671b98902861d3e7e8dc77a44682a7e99a6 Binary files /dev/null and b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/final_frame.png differ diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/first_frame.png b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e1ae491384604388848a8d388981d787c5f64485 Binary files /dev/null and b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/first_frame.png differ diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/ground_truth.mp4 b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2b30a1d4fcedfdc750cee71dadd226c3bb63fe80 --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8254f235487032bae79ff328a0b2034f1cee248345fe3aca867c1bd48240f765 +size 576520 diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/metadata.json b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..26d3ac8c4644c0c282e0938ed129dd311dd15acf --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/metadata.json @@ -0,0 +1,37 @@ +{ + "task_id": "construct_concentric_ring_00000001", + 
"generator": "construct_concentric_ring", + "timestamp": "2026-02-17T07:05:03.945470", + "parameters": { + "outer_radius": 322, + "inner_radius": 168, + "outer_color": [ + 240, + 50, + 230 + ], + "inner_color": [ + 170, + 110, + 40 + ], + "outer_start_position": [ + 336, + 307 + ], + "inner_start_position": [ + 842, + 716 + ] + }, + "param_hash": "cea47abd1139caf0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/prompt.txt b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d7d4427fc2aa39229850395c78d03e0b46147ea --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000001/prompt.txt @@ -0,0 +1,3 @@ +The scene shows two circles of the same color but different sizes at different positions. +Keep both circles unchanged in size and color. Only move their positions. +Move both circles until they share the same center point (concentric circles) exactly at the center of the image. 
\ No newline at end of file diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/final_frame.png b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7323916ac8937d37527acd96d350699cac374a9d Binary files /dev/null and b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/final_frame.png differ diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/first_frame.png b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1cb7d10d26a5a03318bd7392262a8bf79206aa3d Binary files /dev/null and b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/first_frame.png differ diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/ground_truth.mp4 b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..1d59eab7c8e8b86045b533b5ed6768c60c97383e --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0032f6819fbec2669e6168b9b159a17e2487ee00ef0c21ab2b5c684f55b8cc +size 758105 diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/metadata.json b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5f17e6ff33c13097354582a5299269b8814047a0 --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/metadata.json @@ -0,0 +1,37 @@ +{ + "task_id": "construct_concentric_ring_00000002", + 
"generator": "construct_concentric_ring", + "timestamp": "2026-02-17T07:05:04.413793", + "parameters": { + "outer_radius": 390, + "inner_radius": 177, + "outer_color": [ + 72, + 61, + 139 + ], + "inner_color": [ + 72, + 61, + 139 + ], + "outer_start_position": [ + 404, + 307 + ], + "inner_start_position": [ + 833, + 716 + ] + }, + "param_hash": "4ed0c6ce79262b8e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/prompt.txt b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d7d4427fc2aa39229850395c78d03e0b46147ea --- /dev/null +++ b/VBVR-Dataset/construct_concentric_ring_task/construct_concentric_ring_00000002/prompt.txt @@ -0,0 +1,3 @@ +The scene shows two circles of the same color but different sizes at different positions. +Keep both circles unchanged in size and color. Only move their positions. +Move both circles until they share the same center point (concentric circles) exactly at the center of the image. 
\ No newline at end of file diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/final_frame.png b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..074dbf8418c8b92b7b84d770f64c095d3edaa4da Binary files /dev/null and b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/final_frame.png differ diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/first_frame.png b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ebab61d11139c1f4141eb176fb156a1fee78d977 Binary files /dev/null and b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/first_frame.png differ diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/ground_truth.mp4 b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f633ca140ac46fda6f2308764d65bb25d52c8862 --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8ad309b693966ab3f121d6ae8c12a64f7dbad1b05ce291d450aa7d301d409ce +size 301292 diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/metadata.json b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b175501f543f91d541928b5fb4619944f3e400b5 --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/metadata.json @@ -0,0 +1,214 @@ +{ + "task_id": "construction_blueprint_00000000", + "generator": "construction_blueprint", + "timestamp": 
"2026-02-17T07:42:14.741832", + "parameters": { + "correct_index": 0, + "grid_size": 21, + "structure": { + "blocks": [ + [ + 11, + 10 + ], + [ + 10, + 8 + ], + [ + 12, + 10 + ], + [ + 13, + 10 + ], + [ + 9, + 8 + ], + [ + 10, + 9 + ], + [ + 11, + 8 + ], + [ + 12, + 11 + ], + [ + 11, + 11 + ], + [ + 9, + 9 + ], + [ + 8, + 7 + ], + [ + 11, + 9 + ], + [ + 11, + 12 + ], + [ + 10, + 10 + ], + [ + 12, + 12 + ], + [ + 9, + 7 + ] + ], + "color": [ + 75, + 0, + 130 + ] + }, + "gap": { + "grid_positions": [ + [ + 9, + 10 + ], + [ + 9, + 11 + ], + [ + 10, + 11 + ], + [ + 8, + 11 + ] + ], + "center": [ + 460.0, + 448.0 + ] + }, + "candidates": [ + { + "candidate_index": 0, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 1, + 1 + ], + [ + 2, + 1 + ], + [ + 0, + 1 + ] + ], + "center": [ + 142, + 921 + ], + "is_correct": true + }, + { + "candidate_index": 1, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 1, + 1 + ], + [ + 1, + 2 + ], + [ + 0, + 1 + ] + ], + "center": [ + 388, + 921 + ], + "is_correct": false + }, + { + "candidate_index": 2, + "grid_positions": [ + [ + 0, + 1 + ], + [ + 1, + 1 + ], + [ + 0, + 0 + ] + ], + "center": [ + 634, + 921 + ], + "is_correct": false + }, + { + "candidate_index": 3, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 0, + 1 + ], + [ + 0, + 0 + ] + ], + "center": [ + 880, + 921 + ], + "is_correct": false + } + ] + }, + "param_hash": "d0a460d74f3c94d5", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/prompt.txt b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ab2d760b372b60ab1b23d56016c38cd3976811c --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000000/prompt.txt @@ -0,0 +1 @@ +In the scene, the upper structure has a 
missing piece outlined with a dashed line. There are 4 candidate pieces below. The video sequentially checks each candidate from left to right: highlights the current candidate being examined with a frame, previews how the piece fits in the gap, marks it with ✓ if the shape matches or ✗ if it doesn't, then moves to the next candidate. Once the matching piece is found, an animation demonstrates it moving into the gap to complete the structure. \ No newline at end of file diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/final_frame.png b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6c1c1d2c2f2d7fe4b5168d8d7a8ca89bb371742f Binary files /dev/null and b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/final_frame.png differ diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/first_frame.png b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f035ab99b326805f34061e7623d4451ec686d514 Binary files /dev/null and b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/first_frame.png differ diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/ground_truth.mp4 b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..225d6d028d1e0b355d4cd2a8be585fa441d41180 --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02d44da7c87e89ce17b02007192051ac3f3dcf61db1bf13f3a6ab8ca8230999 +size 451550 diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/metadata.json 
b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..997db294995902f717edab9f30e0340bb7f3fd0a --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/metadata.json @@ -0,0 +1,214 @@ +{ + "task_id": "construction_blueprint_00000001", + "generator": "construction_blueprint", + "timestamp": "2026-02-17T07:42:15.803369", + "parameters": { + "correct_index": 2, + "grid_size": 21, + "structure": { + "blocks": [ + [ + 9, + 10 + ], + [ + 10, + 11 + ], + [ + 11, + 10 + ], + [ + 11, + 9 + ], + [ + 12, + 9 + ], + [ + 10, + 10 + ], + [ + 13, + 9 + ], + [ + 12, + 11 + ], + [ + 10, + 12 + ], + [ + 12, + 8 + ], + [ + 11, + 11 + ] + ], + "color": [ + 139, + 90, + 60 + ] + }, + "gap": { + "grid_positions": [ + [ + 13, + 8 + ], + [ + 14, + 8 + ], + [ + 15, + 8 + ], + [ + 13, + 7 + ], + [ + 14, + 7 + ] + ], + "center": [ + 709.6, + 284.2 + ] + }, + "candidates": [ + { + "candidate_index": 0, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 1, + 1 + ], + [ + 2, + 1 + ], + [ + 0, + 0 + ] + ], + "center": [ + 142, + 921 + ], + "is_correct": false + }, + { + "candidate_index": 1, + "grid_positions": [ + [ + 0, + 1 + ], + [ + 0, + 0 + ], + [ + 1, + 1 + ], + [ + 0, + 2 + ], + [ + 1, + 0 + ] + ], + "center": [ + 388, + 921 + ], + "is_correct": false + }, + { + "candidate_index": 2, + "grid_positions": [ + [ + 0, + 1 + ], + [ + 2, + 1 + ], + [ + 0, + 0 + ], + [ + 1, + 1 + ], + [ + 1, + 0 + ] + ], + "center": [ + 634, + 921 + ], + "is_correct": true + }, + { + "candidate_index": 3, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 0, + 1 + ], + [ + 2, + 1 + ], + [ + 0, + 0 + ] + ], + "center": [ + 880, + 921 + ], + "is_correct": false + } + ] + }, + "param_hash": "c79f9503e0f11d1d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git 
a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/prompt.txt b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ab2d760b372b60ab1b23d56016c38cd3976811c --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000001/prompt.txt @@ -0,0 +1 @@ +In the scene, the upper structure has a missing piece outlined with a dashed line. There are 4 candidate pieces below. The video sequentially checks each candidate from left to right: highlights the current candidate being examined with a frame, previews how the piece fits in the gap, marks it with ✓ if the shape matches or ✗ if it doesn't, then moves to the next candidate. Once the matching piece is found, an animation demonstrates it moving into the gap to complete the structure. \ No newline at end of file diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/final_frame.png b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..602d3912c2f6763beaf76df366a64bce8fe23ccf Binary files /dev/null and b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/final_frame.png differ diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/first_frame.png b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..461666276d662f8adbb40b65eaf2e9d0df05eac4 Binary files /dev/null and b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/first_frame.png differ diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/ground_truth.mp4 b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..aadaf5e6db88a4753ce273ca21517632b774af55 --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58616edd9b413e9e3884955a44bdd63149e4e2c64868e31dd316d1d903084ceb +size 403785 diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/metadata.json b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f269cc64b3c3c3a70d56b13f48dd4cae3b4e20d6 --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/metadata.json @@ -0,0 +1,190 @@ +{ + "task_id": "construction_blueprint_00000002", + "generator": "construction_blueprint", + "timestamp": "2026-02-17T07:42:16.693174", + "parameters": { + "correct_index": 2, + "grid_size": 21, + "structure": { + "blocks": [ + [ + 9, + 10 + ], + [ + 10, + 11 + ], + [ + 11, + 10 + ], + [ + 10, + 8 + ], + [ + 10, + 9 + ], + [ + 9, + 11 + ], + [ + 11, + 8 + ], + [ + 12, + 11 + ], + [ + 10, + 12 + ], + [ + 13, + 11 + ], + [ + 11, + 11 + ], + [ + 9, + 9 + ], + [ + 11, + 9 + ], + [ + 12, + 9 + ], + [ + 10, + 10 + ], + [ + 13, + 9 + ], + [ + 12, + 12 + ], + [ + 13, + 12 + ] + ], + "color": [ + 160, + 82, + 45 + ] + }, + "gap": { + "grid_positions": [ + [ + 12, + 10 + ], + [ + 13, + 10 + ] + ], + "center": [ + 642.0, + 409.0 + ] + }, + "candidates": [ + { + "candidate_index": 0, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 0, + 1 + ], + [ + 0, + 0 + ] + ], + "center": [ + 142, + 921 + ], + "is_correct": false + }, + { + "candidate_index": 1, + "grid_positions": [ + [ + 0, + 1 + ], + [ + 0, + 0 + ] + ], + "center": [ + 388, + 921 + ], + "is_correct": false + }, + { + "candidate_index": 2, + "grid_positions": [ + [ + 1, + 0 + ], + [ + 0, + 0 + ] + ], + "center": [ + 634, + 921 + ], + "is_correct": true + }, + { + 
"candidate_index": 3, + "grid_positions": [ + [ + 0, + 0 + ] + ], + "center": [ + 880, + 921 + ], + "is_correct": false + } + ] + }, + "param_hash": "1f2416fdf3f965b7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/prompt.txt b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3ab2d760b372b60ab1b23d56016c38cd3976811c --- /dev/null +++ b/VBVR-Dataset/construction_blueprint_task/construction_blueprint_00000002/prompt.txt @@ -0,0 +1 @@ +In the scene, the upper structure has a missing piece outlined with a dashed line. There are 4 candidate pieces below. The video sequentially checks each candidate from left to right: highlights the current candidate being examined with a frame, previews how the piece fits in the gap, marks it with ✓ if the shape matches or ✗ if it doesn't, then moves to the next candidate. Once the matching piece is found, an animation demonstrates it moving into the gap to complete the structure. 
\ No newline at end of file diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000000/final_frame.png b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d192e1c6978b74d7ac0195f90bcbca1839ca3a09 Binary files /dev/null and b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/final_frame.png differ diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000000/first_frame.png b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5b731bc00c1172a27a3a7fcc5b76e52646dc74f5 Binary files /dev/null and b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/first_frame.png differ diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000000/ground_truth.mp4 b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..87c43dce046e34ac03c5f39b6ff88ca878cb69f6 --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e026117e645004d7629e24a305c95926d70366fdc6303f9a61b680985e3672a +size 137164 diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000000/metadata.json b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9dfcadac86d7f02665def5590a159266ff8470f4 --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/metadata.json @@ -0,0 +1,96 @@ +{ + "task_id": "counting_objects_00000000", + "generator": "counting_objects", + "timestamp": "2026-02-26T09:54:39.136345", + "parameters": { + "num_objects": 5, + "object_shape": "mixed", + "objects": [ + { + "symbol": "object", + "index": 0, + "shape": "circle", + 
"color": [ + 100, + 255, + 100 + ], + "center": [ + 687, + 898 + ], + "size": 50 + }, + { + "symbol": "object", + "index": 1, + "shape": "circle", + "color": [ + 100, + 150, + 255 + ], + "center": [ + 887, + 692 + ], + "size": 58 + }, + { + "symbol": "object", + "index": 2, + "shape": "triangle", + "color": [ + 255, + 200, + 100 + ], + "center": [ + 562, + 678 + ], + "size": 51 + }, + { + "symbol": "object", + "index": 3, + "shape": "triangle", + "color": [ + 255, + 100, + 100 + ], + "center": [ + 192, + 370 + ], + "size": 56 + }, + { + "symbol": "object", + "index": 4, + "shape": "star", + "color": [ + 255, + 100, + 100 + ], + "center": [ + 328, + 671 + ], + "size": 77 + } + ] + }, + "param_hash": "843518348286f8e9", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000000/prompt.txt b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..31a49574421b5a2c44ca48167932e2c52c8080b5 --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000000/prompt.txt @@ -0,0 +1 @@ +The scene displays various geometric objects scattered across the image. Each object is a filled shape with a black outline. Starting from any position in the image, systematically count all visible objects in the scene, regardless of their shape or color. Count each object exactly once, highlighting its border when counting that object, ensuring no object is missed or counted multiple times. After completing the count, display 'Count: N' in the center of the image, where N is the total number of objects found in the scene. 
\ No newline at end of file diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000001/final_frame.png b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..630019f878ec0145a692b3f6e78b8c0cf452dd8d Binary files /dev/null and b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/final_frame.png differ diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000001/first_frame.png b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3d3917e379f18a92d7c7eb22fe204fa8a29766c4 Binary files /dev/null and b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/first_frame.png differ diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000001/ground_truth.mp4 b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5a2fa14cddce2378eb3f53bb54128b52cbd67d3c --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5c8c25b6762d630ef1229355790823c5e72a90304ff1968d267dac6ff20c26 +size 123845 diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000001/metadata.json b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..c1ebec24120c4b6c21d435d963c8120586e84fe8 --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/metadata.json @@ -0,0 +1,81 @@ +{ + "task_id": "counting_objects_00000001", + "generator": "counting_objects", + "timestamp": "2026-02-26T09:54:39.482680", + "parameters": { + "num_objects": 4, + "object_shape": "mixed", + "objects": [ + { + "symbol": "object", + "index": 0, + "shape": "circle", + 
"color": [ + 200, + 100, + 255 + ], + "center": [ + 123, + 693 + ], + "size": 51 + }, + { + "symbol": "object", + "index": 1, + "shape": "square", + "color": [ + 255, + 200, + 100 + ], + "center": [ + 198, + 530 + ], + "size": 60 + }, + { + "symbol": "object", + "index": 2, + "shape": "triangle", + "color": [ + 100, + 150, + 255 + ], + "center": [ + 682, + 320 + ], + "size": 72 + }, + { + "symbol": "object", + "index": 3, + "shape": "star", + "color": [ + 100, + 255, + 100 + ], + "center": [ + 918, + 744 + ], + "size": 71 + } + ] + }, + "param_hash": "edcfe6d30602ef77", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000001/prompt.txt b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..31a49574421b5a2c44ca48167932e2c52c8080b5 --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000001/prompt.txt @@ -0,0 +1 @@ +The scene displays various geometric objects scattered across the image. Each object is a filled shape with a black outline. Starting from any position in the image, systematically count all visible objects in the scene, regardless of their shape or color. Count each object exactly once, highlighting its border when counting that object, ensuring no object is missed or counted multiple times. After completing the count, display 'Count: N' in the center of the image, where N is the total number of objects found in the scene. 
\ No newline at end of file diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000002/final_frame.png b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..047d6c927b4d7f4bd05b99f270196550b2db5c59 Binary files /dev/null and b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/final_frame.png differ diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000002/first_frame.png b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f0ba4435f157fff9e790402bd083d0bd319c2c63 Binary files /dev/null and b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/first_frame.png differ diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000002/ground_truth.mp4 b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d4f47ad0140eb310a9424b360e70ec3c3240d1db --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2ee1862ef90f709aebec8fd36b6c490875de4e2d59dae4f769902cd009fb4b +size 274700 diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000002/metadata.json b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..e4f99298ad85db834c5b54a4ec6ba7d50586dedc --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/metadata.json @@ -0,0 +1,171 @@ +{ + "task_id": "counting_objects_00000002", + "generator": "counting_objects", + "timestamp": "2026-02-26T09:54:40.089069", + "parameters": { + "num_objects": 10, + "object_shape": "mixed", + "objects": [ + { + "symbol": "object", + "index": 0, + "shape": "triangle", + 
"color": [ + 255, + 100, + 100 + ], + "center": [ + 54, + 624 + ], + "size": 76 + }, + { + "symbol": "object", + "index": 1, + "shape": "star", + "color": [ + 255, + 100, + 100 + ], + "center": [ + 854, + 94 + ], + "size": 61 + }, + { + "symbol": "object", + "index": 2, + "shape": "triangle", + "color": [ + 255, + 200, + 100 + ], + "center": [ + 768, + 395 + ], + "size": 72 + }, + { + "symbol": "object", + "index": 3, + "shape": "star", + "color": [ + 100, + 150, + 255 + ], + "center": [ + 687, + 666 + ], + "size": 63 + }, + { + "symbol": "object", + "index": 4, + "shape": "star", + "color": [ + 100, + 255, + 100 + ], + "center": [ + 334, + 393 + ], + "size": 63 + }, + { + "symbol": "object", + "index": 5, + "shape": "star", + "color": [ + 255, + 200, + 100 + ], + "center": [ + 917, + 816 + ], + "size": 78 + }, + { + "symbol": "object", + "index": 6, + "shape": "triangle", + "color": [ + 100, + 255, + 100 + ], + "center": [ + 626, + 426 + ], + "size": 89 + }, + { + "symbol": "object", + "index": 7, + "shape": "triangle", + "color": [ + 100, + 150, + 255 + ], + "center": [ + 495, + 562 + ], + "size": 95 + }, + { + "symbol": "object", + "index": 8, + "shape": "circle", + "color": [ + 255, + 200, + 100 + ], + "center": [ + 673, + 935 + ], + "size": 62 + }, + { + "symbol": "object", + "index": 9, + "shape": "circle", + "color": [ + 255, + 200, + 100 + ], + "center": [ + 179, + 206 + ], + "size": 93 + } + ] + }, + "param_hash": "1b5dfd2c0acd7ac6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/counting_objects_task/counting_objects_00000002/prompt.txt b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..31a49574421b5a2c44ca48167932e2c52c8080b5 --- /dev/null +++ b/VBVR-Dataset/counting_objects_task/counting_objects_00000002/prompt.txt @@ -0,0 +1 @@ 
+The scene displays various geometric objects scattered across the image. Each object is a filled shape with a black outline. Starting from any position in the image, systematically count all visible objects in the scene, regardless of their shape or color. Count each object exactly once, highlighting its border when counting that object, ensuring no object is missed or counted multiple times. After completing the count, display 'Count: N' in the center of the image, where N is the total number of objects found in the scene. \ No newline at end of file diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/final_frame.png b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..39a8d8a5224a6af8fa5e8f4b4c91cef5a7f74d76 Binary files /dev/null and b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/final_frame.png differ diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/first_frame.png b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..646e37248b9d0e9729cc474b84a1622e4c20c286 Binary files /dev/null and b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/first_frame.png differ diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/ground_truth.mp4 b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..35d22f9fcd20e7aba38c1701c4ff08a40c5cc483 --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:5c5cb702e83517e97bc2b6705a408ff795a14c5a753d25ecb9c1752eb1014977 +size 314640 diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/metadata.json b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d50b3d30b1df24ea1e5633a47b9be4e8b196f520 --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/metadata.json @@ -0,0 +1,83 @@ +{ + "task_id": "directed_graph_navigation_00000000", + "generator": "directed_graph_navigation", + "timestamp": "2026-02-17T07:21:11.114899", + "parameters": { + "num_nodes": 5, + "positions": [ + [ + 897, + 855 + ], + [ + 649, + 198 + ], + [ + 175, + 780 + ], + [ + 671, + 762 + ], + [ + 924, + 436 + ] + ], + "edges": [ + [ + 0, + 1 + ], + [ + 1, + 2 + ], + [ + 1, + 3 + ], + [ + 1, + 4 + ], + [ + 4, + 0 + ], + [ + 0, + 3 + ], + [ + 2, + 0 + ], + [ + 3, + 2 + ] + ], + "start_node": 3, + "end_node": 4, + "shortest_path": [ + 3, + 2, + 0, + 1, + 4 + ] + }, + "param_hash": "05416c51d668641a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/prompt.txt b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bc53410a283c43ef80822242c95f25490cb4b89 --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a network of nodes connected by directed edges (edges with arrows indicating direction) with a green starting node, a red ending node, and a blue triangular agent positioned at the green starting node. 
The agent can only move along edges in the direction they point (from the source node to the target node, cannot move backwards), moving from one node to an adjacent node each step. Move the blue triangular agent from the green starting node to the red ending node along the path with the minimum number of steps. \ No newline at end of file diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/final_frame.png b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b836bf36db30fca56dd2431c5e40dd17e6c863f4 Binary files /dev/null and b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/final_frame.png differ diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/first_frame.png b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..90b84e2a2349cc9fbadc869fec611067d42f0e08 Binary files /dev/null and b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/first_frame.png differ diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/ground_truth.mp4 b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2408296fc4b91cd2c4d5dc7b8828460cebe8da3e --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd61f8a952d731a808204baa422d5ce6498d6792c7217d60c7e0632b8d647763 +size 252935 diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/metadata.json 
b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8cb377046fa733a3f309f8d2c4f42e62c7448175 --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/metadata.json @@ -0,0 +1,98 @@ +{ + "task_id": "directed_graph_navigation_00000001", + "generator": "directed_graph_navigation", + "timestamp": "2026-02-17T07:21:11.545990", + "parameters": { + "num_nodes": 7, + "positions": [ + [ + 454, + 654 + ], + [ + 456, + 888 + ], + [ + 120, + 664 + ], + [ + 227, + 220 + ], + [ + 321, + 414 + ], + [ + 822, + 577 + ], + [ + 449, + 322 + ] + ], + "edges": [ + [ + 0, + 1 + ], + [ + 1, + 2 + ], + [ + 0, + 3 + ], + [ + 2, + 4 + ], + [ + 4, + 5 + ], + [ + 4, + 6 + ], + [ + 3, + 6 + ], + [ + 3, + 4 + ], + [ + 5, + 1 + ], + [ + 4, + 1 + ] + ], + "start_node": 1, + "end_node": 6, + "shortest_path": [ + 1, + 2, + 4, + 6 + ] + }, + "param_hash": "6e786d4164b8c4a7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/prompt.txt b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bc53410a283c43ef80822242c95f25490cb4b89 --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a network of nodes connected by directed edges (edges with arrows indicating direction) with a green starting node, a red ending node, and a blue triangular agent positioned at the green starting node. The agent can only move along edges in the direction they point (from the source node to the target node, cannot move backwards), moving from one node to an adjacent node each step. 
Move the blue triangular agent from the green starting node to the red ending node along the path with the minimum number of steps. \ No newline at end of file diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/final_frame.png b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dad94aaf456861b87699731c92d58570e425af5e Binary files /dev/null and b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/final_frame.png differ diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/first_frame.png b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..eca348fb4639631bb7556df3ab95c765d74d4cdd Binary files /dev/null and b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/first_frame.png differ diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/ground_truth.mp4 b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..fc2c61c6e80b7a984139c2446153b904b86d459a --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921e2711eab96622251a0c1ba8ad6c7c1c3a53c4b7b3a1d93e8b9a507776f067 +size 264189 diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/metadata.json b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..de4c31ea865cfbc409e819dbf6d031943ff25c92 --- /dev/null +++ 
b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/metadata.json @@ -0,0 +1,98 @@ +{ + "task_id": "directed_graph_navigation_00000002", + "generator": "directed_graph_navigation", + "timestamp": "2026-02-17T07:21:12.002048", + "parameters": { + "num_nodes": 7, + "positions": [ + [ + 774, + 455 + ], + [ + 621, + 278 + ], + [ + 275, + 127 + ], + [ + 836, + 651 + ], + [ + 366, + 540 + ], + [ + 767, + 195 + ], + [ + 121, + 598 + ] + ], + "edges": [ + [ + 0, + 1 + ], + [ + 1, + 2 + ], + [ + 1, + 3 + ], + [ + 1, + 4 + ], + [ + 3, + 5 + ], + [ + 0, + 6 + ], + [ + 5, + 1 + ], + [ + 6, + 2 + ], + [ + 5, + 0 + ], + [ + 6, + 3 + ] + ], + "start_node": 3, + "end_node": 6, + "shortest_path": [ + 3, + 5, + 0, + 6 + ] + }, + "param_hash": "58defff875cead9d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/prompt.txt b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bc53410a283c43ef80822242c95f25490cb4b89 --- /dev/null +++ b/VBVR-Dataset/directed_graph_navigation_task/directed_graph_navigation_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a network of nodes connected by directed edges (edges with arrows indicating direction) with a green starting node, a red ending node, and a blue triangular agent positioned at the green starting node. The agent can only move along edges in the direction they point (from the source node to the target node, cannot move backwards), moving from one node to an adjacent node each step. Move the blue triangular agent from the green starting node to the red ending node along the path with the minimum number of steps. 
\ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/final_frame.png b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9d15f2b90652e82ba0482794650bf44eb1432a5d Binary files /dev/null and b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/final_frame.png differ diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/first_frame.png b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b8f954a8658ec4a1c6915394a450236763c9ae3e Binary files /dev/null and b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/first_frame.png differ diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/ground_truth.mp4 b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..57db584e85c1a46b3616cc9b69acf1f5952f9c3d --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0dd353cefe666cc0567226ed6ba7c18e369de27999fc446472865807f04717d +size 302541 diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/metadata.json b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..835656e47cd087026b7d561f82230e409e6c6986 --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/metadata.json @@ -0,0 +1,163 @@ +{ + "task_id": "domino_chain_branch_path_prediction_00000000", + "generator": "domino_chain_branch_path_prediction", + "timestamp": "2026-02-17T07:43:51.099791", + "parameters": { + "objects": [ + { + "symbol": "domino", + "id": "START", + "center": [ + 79, + 536 + ], + "branch": "trunk", + "color": [ + 50, + 150, + 50 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "T1", + "center": [ + 214, + 536 + ], + "branch": "trunk", + "color": [ + 75, + 75, + 80 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "T2", + "center": [ + 349, + 536 + ], + "branch": "trunk", + "color": [ + 75, + 75, + 80 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "A1", + "center": [ + 484, + 436 + ], + "branch": "A", + "color": [ + 170, + 55, + 115 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "A2", + "center": [ + 619, + 418.17 + ], + "branch": "A", + "color": [ + 170, + 55, + 115 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B1", + "center": [ + 484, + 636 + ], + "branch": "B", + "color": [ + 100, + 150, + 210 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B2", + "center": [ + 619, + 653.83 + ], + "branch": "B", + "color": [ + 100, + 150, + 210 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B3", + "center": [ + 754, + 671.66 + ], + "branch": "B", + "color": [ + 100, + 150, + 210 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B4", + "center": [ + 889, + 689.49 + ], + "branch": "B", + "color": [ + 100, + 150, + 210 + ], + "angle": 0, + "will_fall": true + } + ] + }, + "param_hash": "4df0c7b6cc00f232", + "generation": 
{ + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/prompt.txt b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..dfb7283b4cfa1d3220ba0e3fc42bd430463f1a3a --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000000/prompt.txt @@ -0,0 +1 @@ +Push the green START domino to begin the chain reaction. Show the complete domino falling process. The dominos fall step by step from left to right, turning darker as they fall. The gray trunk falls first, then splits into the red Branch A (upward) and blue Branch B (downward). Both branches complete successfully The final state shows all dominos fallen and tilted right. 
\ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/final_frame.png b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fdd5abaeaee2e31ef3e61ab92355e0b056c163d0 Binary files /dev/null and b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/final_frame.png differ diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/first_frame.png b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..880fee6c95328e6fcc71459e3cb9df7677e0cae6 Binary files /dev/null and b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/first_frame.png differ diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/ground_truth.mp4 b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4b24d260be077e532f6e1a0178d628a98ba66ae1 --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9923608951c13f492e26793d1f129e5ca308114af1724d935401a184915cf1 +size 276876 diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/metadata.json b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..be2bc0c39b83e564b1c62caa3915af0fa0e6d393 --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/metadata.json @@ -0,0 +1,149 @@ +{ + "task_id": "domino_chain_branch_path_prediction_00000001", + "generator": "domino_chain_branch_path_prediction", + "timestamp": "2026-02-17T07:43:51.790858", + "parameters": { + "blocked_branch": "B", + "block_after_index": 0, + "objects": [ + { + "symbol": "domino", + "id": "START", + "center": [ + 68, + 483 + ], + "branch": "trunk", + "color": [ + 70, + 170, + 70 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "T1", + "center": [ + 202, + 483 + ], + "branch": "trunk", + "color": [ + 75, + 75, + 85 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "T2", + "center": [ + 336, + 483 + ], + "branch": "trunk", + "color": [ + 75, + 75, + 85 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "T3", + "center": [ + 470, + 483 + ], + "branch": "trunk", + "color": [ + 75, + 75, + 85 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "A1", + "center": [ + 604, + 393 + ], + "branch": "A", + "color": [ + 180, + 50, + 110 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "A2", + "center": [ + 738, + 379.56 + ], + "branch": "A", + "color": [ + 180, + 50, + 110 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B1", + "center": [ + 604, + 573 + ], + "branch": "B", + "color": [ + 35, + 75, + 170 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B2", + "center": [ + 738, + 586.44 + ], + "branch": "B", + "color": [ + 35, + 75, + 170 + ], + "angle": 0, + "will_fall": false + } + ] + }, + "param_hash": "31d025b51ad493cc", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No 
newline at end of file diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/prompt.txt b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fba2d2d2d133bab300d019d7e1a38dd22c7aadb3 --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000001/prompt.txt @@ -0,0 +1 @@ +Push the green START domino to begin the chain reaction. Show the complete domino falling process. The dominos fall step by step from left to right, turning darker as they fall. The gray trunk falls first, then splits into the red Branch A (upward) and indigo Branch B (downward). Branch B has a gap marked with a red X that stops the chain reaction in that branch The final state shows Branch B with fallen dominos before the gap and standing dominos after, while Branch A completes fully. 
\ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/final_frame.png b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c1483bd4e6ec6fc0563affdcb0f1c1ac66f06058 Binary files /dev/null and b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/final_frame.png differ diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/first_frame.png b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7f5f80f2353dcf397bf1b5c51582dd0ebd263c51 Binary files /dev/null and b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/first_frame.png differ diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/ground_truth.mp4 b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6395cc000fd9c3c7b44b29d21a9816f5e0ff6bdc --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0900239eef5f4f04527dedf80c131d287b8176e320ad2fd2ded5eb52707a0400 +size 262653 diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/metadata.json b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..4ed865f8e899fcdfcd362f09b55d276c9b2b2a55 --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/metadata.json @@ -0,0 +1,131 @@ +{ + "task_id": "domino_chain_branch_path_prediction_00000002", + "generator": "domino_chain_branch_path_prediction", + "timestamp": "2026-02-17T07:43:52.418855", + "parameters": { + "objects": [ + { + "symbol": "domino", + "id": "START", + "center": [ + 90, + 513 + ], + "branch": "trunk", + "color": [ + 90, + 210, + 90 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "T1", + "center": [ + 225, + 513 + ], + "branch": "trunk", + "color": [ + 70, + 65, + 60 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "A1", + "center": [ + 360, + 419 + ], + "branch": "A", + "color": [ + 200, + 60, + 120 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "A2", + "center": [ + 495, + 392.93 + ], + "branch": "A", + "color": [ + 200, + 60, + 120 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B1", + "center": [ + 360, + 607 + ], + "branch": "B", + "color": [ + 30, + 70, + 160 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B2", + "center": [ + 495, + 633.07 + ], + "branch": "B", + "color": [ + 30, + 70, + 160 + ], + "angle": 0, + "will_fall": true + }, + { + "symbol": "domino", + "id": "B3", + "center": [ + 630, + 659.15 + ], + "branch": "B", + "color": [ + 30, + 70, + 160 + ], + "angle": 0, + "will_fall": true + } + ] + }, + "param_hash": "ebb2003dfd959ed7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/prompt.txt 
b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..f16f3b2d15b6ae900eb53f6572eae44cc3845ba5 --- /dev/null +++ b/VBVR-Dataset/domino_chain_branch_path_prediction_task/domino_chain_branch_path_prediction_00000002/prompt.txt @@ -0,0 +1 @@ +Push the bright green START domino to begin the chain reaction. Show the complete domino falling process. The dominos fall step by step from left to right, turning darker as they fall. The dark gray trunk falls first, then splits into the red Branch A (upward) and indigo Branch B (downward). Both branches complete successfully The final state shows all dominos fallen and tilted right. \ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/final_frame.png b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fefc209b5020c1766d014463d03f5c5e0f05fb3c Binary files /dev/null and b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/final_frame.png differ diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/first_frame.png b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2ce0e45ddc97d04fc5fb919af918fd3ccc3bed5e Binary files /dev/null and b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/first_frame.png differ diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/ground_truth.mp4 b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cf5d3720d29340be5ac1183576411ae53a8301c0 --- 
/dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd69f6f6fe7ef98c6df7c62495eb4df853ee4589136528dc4ddc6fc583f49fbb +size 585528 diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/metadata.json b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..38875c147f27e035a7a0d5dad147c40e98aa121f --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/metadata.json @@ -0,0 +1,150 @@ +{ + "task_id": "domino_chain_gap_analysis_00000000", + "generator": "domino_chain_gap_analysis", + "timestamp": "2026-02-17T07:44:43.810761", + "parameters": { + "gap_after": 5, + "answer": 6, + "last_fallen_index": 5, + "objects": [ + { + "symbol": "domino", + "index": 1, + "center": [ + 191, + 618.5 + ], + "position": 191, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 2, + "center": [ + 275, + 618.5 + ], + "position": 275, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 3, + "center": [ + 341, + 618.5 + ], + "position": 341, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 4, + "center": [ + 407, + 618.5 + ], + "position": 407, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 5, + "center": [ + 498, + 618.5 + ], + "position": 498, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 6, + "center": [ + 565, + 618.5 + ], + "position": 565, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + 
"is_last_fallen": true + }, + { + "symbol": "domino", + "index": 7, + "center": [ + 766, + 618.5 + ], + "position": 766, + "color": [ + 30, + 144, + 255 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 8, + "center": [ + 842, + 618.5 + ], + "position": 842, + "color": [ + 30, + 144, + 255 + ], + "is_fallen": false, + "is_last_fallen": false + } + ] + }, + "param_hash": "7bb469234dc853b1", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/prompt.txt b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..27e2a0a996dc9452a8082ec46f224fd5a91f9e07 --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000000/prompt.txt @@ -0,0 +1 @@ +Analyze the domino chain to find which domino is the last to fall. Push the first domino and watch as each domino falls and turns red. The chain will stop when it reaches a gap that is too wide. This gap will be marked "TOO FAR!" in red. The last fallen domino will be circled in green as the answer. 
\ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/final_frame.png b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..27b606f54d8a23f6e8118f15c6f55a10495ca1f6 Binary files /dev/null and b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/final_frame.png differ diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/first_frame.png b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f3468a94d50816a1a87ca20d185b64ad87c5daec Binary files /dev/null and b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/first_frame.png differ diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/ground_truth.mp4 b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..714ecf0443a4a90b1192f095fb61c49fa27b0587 --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702df72152c81ddb9bb5918c95c32e5b1f9c46b75e40f4c384f6019e6834a8f1 +size 429051 diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/metadata.json b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..18626653427f16b48e618ecb4820bdd7415e7aa4 --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/metadata.json @@ -0,0 +1,198 @@ +{ + "task_id": "domino_chain_gap_analysis_00000001", 
+ "generator": "domino_chain_gap_analysis", + "timestamp": "2026-02-17T07:44:44.621280", + "parameters": { + "gap_after": 1, + "answer": 2, + "last_fallen_index": 1, + "objects": [ + { + "symbol": "domino", + "index": 1, + "center": [ + 177, + 666.5 + ], + "position": 177, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 2, + "center": [ + 254, + 666.5 + ], + "position": 254, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": true + }, + { + "symbol": "domino", + "index": 3, + "center": [ + 473, + 666.5 + ], + "position": 473, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 4, + "center": [ + 542, + 666.5 + ], + "position": 542, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 5, + "center": [ + 617, + 666.5 + ], + "position": 617, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 6, + "center": [ + 688, + 666.5 + ], + "position": 688, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 7, + "center": [ + 751, + 666.5 + ], + "position": 751, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 8, + "center": [ + 831, + 666.5 + ], + "position": 831, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 9, + "center": [ + 899, + 666.5 + ], + "position": 899, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 10, + "center": [ + 958, + 666.5 + ], + "position": 958, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + }, 
+ { + "symbol": "domino", + "index": 11, + "center": [ + 1035, + 666.5 + ], + "position": 1035, + "color": [ + 0, + 206, + 209 + ], + "is_fallen": false, + "is_last_fallen": false + } + ] + }, + "param_hash": "62fa6bfc18cd2463", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/prompt.txt b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..27e2a0a996dc9452a8082ec46f224fd5a91f9e07 --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000001/prompt.txt @@ -0,0 +1 @@ +Analyze the domino chain to find which domino is the last to fall. Push the first domino and watch as each domino falls and turns red. The chain will stop when it reaches a gap that is too wide. This gap will be marked "TOO FAR!" in red. The last fallen domino will be circled in green as the answer. 
\ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/final_frame.png b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..94839e14433521d7ad4a18914d2232f5343df5ed Binary files /dev/null and b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/final_frame.png differ diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/first_frame.png b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3fc16175991129c728142c37f21e942a7a81d756 Binary files /dev/null and b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/first_frame.png differ diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/ground_truth.mp4 b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..375db46994d13ef2fe60f13055bc819a0c61f221 --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ebdd5ed45a118d9feb28b5faa1d922132ec9b1843f35b893da35ed25b2921c +size 520925 diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/metadata.json b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a721e25faf72c36531deb3ef1923bd440bbe1f0d --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/metadata.json @@ -0,0 +1,150 @@ +{ + "task_id": "domino_chain_gap_analysis_00000002", 
+ "generator": "domino_chain_gap_analysis", + "timestamp": "2026-02-17T07:44:45.758616", + "parameters": { + "gap_after": 4, + "answer": 5, + "last_fallen_index": 4, + "objects": [ + { + "symbol": "domino", + "index": 1, + "center": [ + 160, + 630.0 + ], + "position": 160, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 2, + "center": [ + 243, + 630.0 + ], + "position": 243, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 3, + "center": [ + 331, + 630.0 + ], + "position": 331, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 4, + "center": [ + 416, + 630.0 + ], + "position": 416, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 5, + "center": [ + 507, + 630.0 + ], + "position": 507, + "color": [ + 231, + 76, + 60 + ], + "is_fallen": true, + "is_last_fallen": true + }, + { + "symbol": "domino", + "index": 6, + "center": [ + 710, + 630.0 + ], + "position": 710, + "color": [ + 243, + 156, + 18 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 7, + "center": [ + 792, + 630.0 + ], + "position": 792, + "color": [ + 243, + 156, + 18 + ], + "is_fallen": false, + "is_last_fallen": false + }, + { + "symbol": "domino", + "index": 8, + "center": [ + 853, + 630.0 + ], + "position": 853, + "color": [ + 243, + 156, + 18 + ], + "is_fallen": false, + "is_last_fallen": false + } + ] + }, + "param_hash": "d2834e28852854e6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/prompt.txt 
b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..27e2a0a996dc9452a8082ec46f224fd5a91f9e07 --- /dev/null +++ b/VBVR-Dataset/domino_chain_gap_analysis_task/domino_chain_gap_analysis_00000002/prompt.txt @@ -0,0 +1 @@ +Analyze the domino chain to find which domino is the last to fall. Push the first domino and watch as each domino falls and turns red. The chain will stop when it reaches a gap that is too wide. This gap will be marked "TOO FAR!" in red. The last fallen domino will be circled in green as the answer. \ No newline at end of file diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/final_frame.png b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0e3803aa28bdc44932842ee771a0ceb711f224ee Binary files /dev/null and b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/final_frame.png differ diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/first_frame.png b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0bb02053f07ab24be8195886d172df63d5c3b9a1 Binary files /dev/null and b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/first_frame.png differ diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/ground_truth.mp4 b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2020e9b2c18d9a283506acc5a939892f0a5bc99a --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1b4fb3edc85110433219f32d6cd184b9cab598d5adc1400496bbfd1f09de64 +size 343466 diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/metadata.json 
b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..02b5f59a7f531dcba1f83075e1024dce7eee9217 --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/metadata.json @@ -0,0 +1,106 @@ +{ + "task_id": "dot_to_dot_00000000", + "generator": "dot_to_dot", + "timestamp": "2026-02-26T09:55:02.809128", + "parameters": { + "num_dots": 5, + "connection_type": "sequential", + "line_color": [ + 255, + 80, + 80 + ], + "objects": [ + { + "symbol": "dot", + "index": 0, + "number": 1, + "center": [ + 684, + 233 + ], + "color": [ + 255, + 100, + 150 + ], + "radius": 45, + "next_dot_index": 1 + }, + { + "symbol": "dot", + "index": 1, + "number": 2, + "center": [ + 210, + 815 + ], + "color": [ + 255, + 255, + 100 + ], + "radius": 45, + "next_dot_index": 2 + }, + { + "symbol": "dot", + "index": 2, + "number": 3, + "center": [ + 706, + 797 + ], + "color": [ + 150, + 255, + 100 + ], + "radius": 45, + "next_dot_index": 3 + }, + { + "symbol": "dot", + "index": 3, + "number": 4, + "center": [ + 471, + 445 + ], + "color": [ + 100, + 150, + 255 + ], + "radius": 45, + "next_dot_index": 4 + }, + { + "symbol": "dot", + "index": 4, + "number": 5, + "center": [ + 268, + 160 + ], + "color": [ + 255, + 200, + 100 + ], + "radius": 45, + "next_dot_index": null + } + ] + }, + "param_hash": "63bf165613ef11cd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/prompt.txt b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..77cb4174c004d427848e5023c2ba2a31f655d2e5 --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 5 numbered dots scattered across the image. 
Connect the dots in numerical order (1→2→3→...→5) by drawing red straight lines between them, one line at a time in sequence. \ No newline at end of file diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/final_frame.png b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c4482e507d0c14a1b123cc78ca30e9728f632656 Binary files /dev/null and b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/final_frame.png differ diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/first_frame.png b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6f78bffa4dafa35b60448da6e0abd79a8747d4f6 Binary files /dev/null and b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/first_frame.png differ diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/ground_truth.mp4 b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0bcec161e28325340ca72293d82816ee447e82fe --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5549e641c10aa4a7a6dca97b5dd36dadb573ec277da3372f956ba19e8048ef5a +size 738533 diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/metadata.json b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa84d4d042782a3c5a3e340f772a402d9a38bb0 --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/metadata.json @@ -0,0 +1,154 @@ +{ + "task_id": "dot_to_dot_00000001", + "generator": "dot_to_dot", + "timestamp": "2026-02-26T09:55:04.731583", + "parameters": { + "num_dots": 8, + "connection_type": "sequential", + "line_color": [ + 255, + 80, + 80 + ], + "objects": [ + { + "symbol": "dot", + "index": 0, + "number": 
1, + "center": [ + 798, + 732 + ], + "color": [ + 255, + 150, + 100 + ], + "radius": 45, + "next_dot_index": 1 + }, + { + "symbol": "dot", + "index": 1, + "number": 2, + "center": [ + 477, + 547 + ], + "color": [ + 255, + 255, + 100 + ], + "radius": 45, + "next_dot_index": 2 + }, + { + "symbol": "dot", + "index": 2, + "number": 3, + "center": [ + 345, + 889 + ], + "color": [ + 255, + 150, + 100 + ], + "radius": 45, + "next_dot_index": 3 + }, + { + "symbol": "dot", + "index": 3, + "number": 4, + "center": [ + 492, + 208 + ], + "color": [ + 100, + 255, + 255 + ], + "radius": 45, + "next_dot_index": 4 + }, + { + "symbol": "dot", + "index": 4, + "number": 5, + "center": [ + 778, + 283 + ], + "color": [ + 100, + 255, + 255 + ], + "radius": 45, + "next_dot_index": 5 + }, + { + "symbol": "dot", + "index": 5, + "number": 6, + "center": [ + 156, + 310 + ], + "color": [ + 100, + 150, + 255 + ], + "radius": 45, + "next_dot_index": 6 + }, + { + "symbol": "dot", + "index": 6, + "number": 7, + "center": [ + 565, + 870 + ], + "color": [ + 255, + 100, + 150 + ], + "radius": 45, + "next_dot_index": 7 + }, + { + "symbol": "dot", + "index": 7, + "number": 8, + "center": [ + 861, + 515 + ], + "color": [ + 255, + 100, + 150 + ], + "radius": 45, + "next_dot_index": null + } + ] + }, + "param_hash": "985e52718459dd35", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/prompt.txt b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..65edbe9cadabbd94fde53cb240c74a15473dadb4 --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 8 numbered dots scattered across the image. Connect the dots in numerical order (1→2→3→...→8) by drawing red straight lines between them, one line at a time in sequence. 
\ No newline at end of file diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/final_frame.png b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d24704fda6b98f16ffb5e218fb09f6e2d2c35918 Binary files /dev/null and b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/final_frame.png differ diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/first_frame.png b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a25d03afa68951a0f24fb37862aaddb49b1796d0 Binary files /dev/null and b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/first_frame.png differ diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/ground_truth.mp4 b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..865283ebd2c3ed37ddc9165492b0cce657711c52 --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c75bca7704a1f7e89d62064e76993d9e8b7cf3a2f7649d87ae91395eb51d00 +size 245017 diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/metadata.json b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ef3f5f7c5cde47c4528009407dd03d2fbd0ecb2d --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/metadata.json @@ -0,0 +1,90 @@ +{ + "task_id": "dot_to_dot_00000002", + "generator": "dot_to_dot", + "timestamp": "2026-02-26T09:55:05.311006", + "parameters": { + "num_dots": 4, + "connection_type": "sequential", + "line_color": [ + 255, + 80, + 80 + ], + "objects": [ + { + "symbol": "dot", + "index": 0, + "number": 1, + "center": [ + 633, + 356 + ], + "color": [ + 100, + 150, + 255 + ], + "radius": 45, + "next_dot_index": 1 + }, + { + 
"symbol": "dot", + "index": 1, + "number": 2, + "center": [ + 449, + 857 + ], + "color": [ + 100, + 255, + 255 + ], + "radius": 45, + "next_dot_index": 2 + }, + { + "symbol": "dot", + "index": 2, + "number": 3, + "center": [ + 357, + 529 + ], + "color": [ + 200, + 100, + 255 + ], + "radius": 45, + "next_dot_index": 3 + }, + { + "symbol": "dot", + "index": 3, + "number": 4, + "center": [ + 635, + 139 + ], + "color": [ + 100, + 255, + 255 + ], + "radius": 45, + "next_dot_index": null + } + ] + }, + "param_hash": "99e28981c8a67222", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/prompt.txt b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..358b4b34071efd8f0c74da8d599c579b9abeffcd --- /dev/null +++ b/VBVR-Dataset/dot_to_dot_task/dot_to_dot_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 numbered dots scattered across the image. Connect the dots in numerical order (1→2→3→...→4) by drawing red straight lines between them, one line at a time in sequence. 
\ No newline at end of file diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/final_frame.png b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c0b54522d067a84a2aa42c632361fcc4e7666c61 Binary files /dev/null and b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/final_frame.png differ diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/first_frame.png b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5b4dc87d55e9788bf8bf3edf785bc7e53e0954b1 Binary files /dev/null and b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/first_frame.png differ diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/ground_truth.mp4 b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..47a91066a04229b6b5563dbffb05ca54a558cd74 --- /dev/null +++ b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a31afbad3372bd98b75aaabac429313d3eceaba4208a07922634b803bc441a7 +size 179366 diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/metadata.json b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..63975473fa28ebc483e5e625bdfd72512c533741 --- /dev/null +++ 
b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/metadata.json @@ -0,0 +1,69 @@ +{ + "task_id": "find_fragment_for_gap_filling_00000000", + "generator": "find_fragment_for_gap_filling", + "timestamp": "2026-02-17T06:48:49.118212", + "parameters": { + "base_shape": { + "type": "hexagon", + "size": 208, + "color": [ + 0, + 170, + 0 + ] + }, + "cutout": { + "type": "square", + "size": 89 + }, + "candidates": [ + { + "type": "square", + "size": 89, + "color": [ + 0, + 180, + 180 + ] + }, + { + "type": "square", + "size": 64, + "color": [ + 0, + 170, + 0 + ] + }, + { + "type": "square", + "size": 40, + "color": [ + 255, + 105, + 180 + ] + }, + { + "type": "square", + "size": 90, + "color": [ + 0, + 0, + 255 + ] + } + ], + "correct_index": 0 + }, + "param_hash": "728e60e413ea7c77", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/prompt.txt b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b6a4ffe86c82c7368e67bf3808580dbb028b98d --- /dev/null +++ b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000000/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top PUZZLE area and a bottom CHOICES area. In the PUZZLE area, the center shape has a missing cut-out outlined in black. In the CHOICES area, there are 4 candidate pieces of the same shape but different sizes. First compare the candidate sizes and determine which single option would fit the missing cut-out exactly (a perfect match in size). Do not use color as a clue. Then circle the correct option. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/final_frame.png b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7687c10a9b19f4cd729f45ecfdd050dcf070146f Binary files /dev/null and b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/final_frame.png differ diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/first_frame.png b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..61b0c7622a2f5e88a4e57fd570f9462fb16ce5dd Binary files /dev/null and b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/first_frame.png differ diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/ground_truth.mp4 b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..dd55067f5ff39d19115847b53278edf1b8cbf109 --- /dev/null +++ b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3728cb1c913b8c721c0016a36a861ee5df0b8a8775f1b59ffbc0d5be1e7076d4 +size 194640 diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/metadata.json b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d56a51ca88a9d5362021151dd10cf8379bb82f66 --- /dev/null +++ 
b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/metadata.json @@ -0,0 +1,69 @@ +{ + "task_id": "find_fragment_for_gap_filling_00000001", + "generator": "find_fragment_for_gap_filling", + "timestamp": "2026-02-17T06:48:49.545056", + "parameters": { + "base_shape": { + "type": "hexagon", + "size": 204, + "color": [ + 154, + 205, + 50 + ] + }, + "cutout": { + "type": "triangle", + "size": 79 + }, + "candidates": [ + { + "type": "triangle", + "size": 59, + "color": [ + 0, + 170, + 0 + ] + }, + { + "type": "triangle", + "size": 79, + "color": [ + 0, + 0, + 0 + ] + }, + { + "type": "triangle", + "size": 40, + "color": [ + 0, + 0, + 255 + ] + }, + { + "type": "triangle", + "size": 90, + "color": [ + 255, + 105, + 180 + ] + } + ], + "correct_index": 1 + }, + "param_hash": "954733f803b53967", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/prompt.txt b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b6a4ffe86c82c7368e67bf3808580dbb028b98d --- /dev/null +++ b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000001/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top PUZZLE area and a bottom CHOICES area. In the PUZZLE area, the center shape has a missing cut-out outlined in black. In the CHOICES area, there are 4 candidate pieces of the same shape but different sizes. First compare the candidate sizes and determine which single option would fit the missing cut-out exactly (a perfect match in size). Do not use color as a clue. Then circle the correct option. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/final_frame.png b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d95f552c23c04bb61fb772bb1d5dc3be584864fe Binary files /dev/null and b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/final_frame.png differ diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/first_frame.png b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0819465e70f25b58976b5b3604cabdf6a9d4f387 Binary files /dev/null and b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/first_frame.png differ diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/ground_truth.mp4 b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7d006045cbb235d7efefb1ec3ffc4c3a8899d044 --- /dev/null +++ b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ac68d70f6e4f84644482639ee19d8d6d30c317355edd5070153b554a351672 +size 149051 diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/metadata.json b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..665c350cee906faffa10b37f217b78cf8e9fd962 --- /dev/null +++ 
b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/metadata.json @@ -0,0 +1,69 @@ +{ + "task_id": "find_fragment_for_gap_filling_00000002", + "generator": "find_fragment_for_gap_filling", + "timestamp": "2026-02-17T06:48:49.988360", + "parameters": { + "base_shape": { + "type": "circle", + "size": 208, + "color": [ + 64, + 224, + 208 + ] + }, + "cutout": { + "type": "square", + "size": 43 + }, + "candidates": [ + { + "type": "square", + "size": 43, + "color": [ + 255, + 140, + 0 + ] + }, + { + "type": "square", + "size": 40, + "color": [ + 154, + 205, + 50 + ] + }, + { + "type": "square", + "size": 90, + "color": [ + 0, + 180, + 180 + ] + }, + { + "type": "square", + "size": 67, + "color": [ + 0, + 0, + 255 + ] + } + ], + "correct_index": 0 + }, + "param_hash": "ebb82d6c7715ad44", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/prompt.txt b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b6a4ffe86c82c7368e67bf3808580dbb028b98d --- /dev/null +++ b/VBVR-Dataset/find_fragment_for_gap_filling_task/find_fragment_for_gap_filling_00000002/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top PUZZLE area and a bottom CHOICES area. In the PUZZLE area, the center shape has a missing cut-out outlined in black. In the CHOICES area, there are 4 candidate pieces of the same shape but different sizes. First compare the candidate sizes and determine which single option would fit the missing cut-out exactly (a perfect match in size). Do not use color as a clue. Then circle the correct option. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/final_frame.png b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dedc680a079d76edfc6f6b61d15c4d911b373298 Binary files /dev/null and b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/final_frame.png differ diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/first_frame.png b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b37e8b233c727ef129c2d0c55d397f4275695617 Binary files /dev/null and b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/first_frame.png differ diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/ground_truth.mp4 b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..034d44c68c4723d80d2756465d7e09aaaa33cb7e --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71588d8ae41c4421d9d2d0db8926e3630017a56a1f9c8f7ea3ebdb24786c93f2 +size 357991 diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/metadata.json b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1d3e3999523c7ac67deef40aeff5a2ef79eb84b7 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "find_keys_and_open_doors_00000000", + "generator": 
"find_keys_and_open_doors", + "timestamp": "2026-02-17T07:29:42.598865", + "parameters": { + "style": "grid", + "agent_start_position": [ + 8, + 5 + ], + "key": { + "pos": [ + 7, + 3 + ], + "color": [ + 255, + 128, + 0 + ] + }, + "door": { + "pos": [ + 1, + 9 + ], + "color": [ + 255, + 255, + 0 + ] + }, + "grid": [ + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1], + [1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1] + ], + "width": 13, + "height": 13 + }, + "param_hash": "f15e1fce24ad27b6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/prompt.txt b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..acbd6cedbbbf06fd719af8f5a6dfbacaf69f29e1 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000000/prompt.txt @@ -0,0 +1 @@ +In the maze, the agent is the green circle. First move the agent to collect the key (diamond shape), then move the agent to the door (hollow rectangle). Use the shortest path for each movement. Show the complete movement step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/final_frame.png b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4541ded34160f95232dae521711ad525e1c307e1 Binary files /dev/null and b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/final_frame.png differ diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/first_frame.png b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..65131eae7df6df152b60f8a9ae1ed68934a40a7f Binary files /dev/null and b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/first_frame.png differ diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/ground_truth.mp4 b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b24d5f579cc1a1fb88e6479f592750a2b183bd78 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14bdc5d23121f09b85aba86223f53eb94d4f328c089a7dc8ab9dd69c9f3c48e3 +size 494728 diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/metadata.json b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..e89c3b0a521fa840a0d47cef28da2ae3aee064e5 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "find_keys_and_open_doors_00000001", + "generator": 
"find_keys_and_open_doors", + "timestamp": "2026-02-17T07:29:43.698245", + "parameters": { + "style": "grid", + "agent_start_position": [ + 9, + 1 + ], + "key": { + "pos": [ + 1, + 10 + ], + "color": [ + 255, + 128, + 0 + ] + }, + "door": { + "pos": [ + 11, + 7 + ], + "color": [ + 0, + 255, + 255 + ] + }, + "grid": [ + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1], + [1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1], + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1] + ], + "width": 13, + "height": 13 + }, + "param_hash": "83fa2418daf24baf", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/prompt.txt b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..acbd6cedbbbf06fd719af8f5a6dfbacaf69f29e1 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000001/prompt.txt @@ -0,0 +1 @@ +In the maze, the agent is the green circle. First move the agent to collect the key (diamond shape), then move the agent to the door (hollow rectangle). Use the shortest path for each movement. Show the complete movement step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/final_frame.png b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a237579665573947ec355cbda0fd8c88095c6a23 Binary files /dev/null and b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/final_frame.png differ diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/first_frame.png b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..083475eee2fb72eb91879eb38dab3472241deed8 Binary files /dev/null and b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/first_frame.png differ diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/ground_truth.mp4 b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a72eeec895e8c27e304b59735d9bdc01cae29526 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0841461fdee04a55e8fc41fec664a8d72b7349958ae39f6ed74ff5d8eb31fa46 +size 682917 diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/metadata.json b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..df60c5525bb66b260d2d2aecca0c4fee572ba369 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "find_keys_and_open_doors_00000002", + "generator": 
"find_keys_and_open_doors", + "timestamp": "2026-02-17T07:29:45.302123", + "parameters": { + "style": "grid", + "agent_start_position": [ + 4, + 5 + ], + "key": { + "pos": [ + 10, + 11 + ], + "color": [ + 255, + 0, + 255 + ] + }, + "door": { + "pos": [ + 8, + 3 + ], + "color": [ + 255, + 255, + 0 + ] + }, + "grid": [ + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], + [1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1], + [1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1], + [1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1], + [1, 0, 1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1] + ], + "width": 13, + "height": 13 + }, + "param_hash": "1e3c899c3a3d15c9", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/prompt.txt b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..acbd6cedbbbf06fd719af8f5a6dfbacaf69f29e1 --- /dev/null +++ b/VBVR-Dataset/find_keys_and_open_doors_task/find_keys_and_open_doors_00000002/prompt.txt @@ -0,0 +1 @@ +In the maze, the agent is the green circle. First move the agent to collect the key (diamond shape), then move the agent to the door (hollow rectangle). Use the shortest path for each movement. Show the complete movement step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/final_frame.png b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c0b2e6765263e117aafe4397e5b50926d061598e Binary files /dev/null and b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/final_frame.png differ diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/first_frame.png b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e0b1d5a9b1de7db1ea5dba58de754c55de148e9e Binary files /dev/null and b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/first_frame.png differ diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/ground_truth.mp4 b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..902778a05ec1daa3a7a2e31cc061f118402237ca --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854422c4d336e6a315c9cdfdb02512a1ca1bdb20b91d6473627ae78453a52c52 +size 315857 diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/metadata.json b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..2de2e2f4a3a24aee2eca6fe760473994f208cec2 --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "glass_refraction_00000000", + "generator": "glass_refraction", + "timestamp": "2026-02-17T07:41:22.044763", + "parameters": { + "n_glass": 1.93609, + "n_air": 1.0, + "theta_incident_degrees": 63.391636, + "theta_refracted_degrees": 27.503406, + 
"objects": [ + { + "symbol": "ray", + "start": [ + 50, + 280.563278 + ], + "end": [ + 512, + 512 + ], + "type": "incident", + "angle_degrees": 63.391636 + }, + { + "symbol": "ray", + "start": [ + 512, + 512 + ], + "end": [ + 752.536884, + 974 + ], + "type": "refracted", + "angle_degrees": 27.503406 + } + ] + }, + "param_hash": "1a4ac4bd0bf01b33", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/prompt.txt b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..60768adf11f99cee7a5d88994531945c2e2115db --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000000/prompt.txt @@ -0,0 +1 @@ +A light ray enters glass from air. The glass refractive index is 1.94, and the incident angle is 63.4 degrees. Using Snell's law, predict how the light ray refracts as it enters the glass. Draw the refracted ray from the point where the incident ray hits the glass surface, extending to the image edge. Show the complete refracted ray path inside the glass. 
\ No newline at end of file diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/final_frame.png b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..54f9887565eb8648c8c75fc4fe7b4598eb79d072 Binary files /dev/null and b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/final_frame.png differ diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/first_frame.png b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..59938b7fe88555ff8f147c6c8f54ea93ba45dd86 Binary files /dev/null and b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/first_frame.png differ diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/ground_truth.mp4 b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..72b5f9769c26915ff489400ccd18ffd1aec637f9 --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37b5cbc57803f4f3fbf44c5fbd14f5171a0dc556211d5ee4347ceee00440179 +size 261963 diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/metadata.json b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6090d6f1b3be7aec6d9d7b6bc3c4205ebc910771 --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "glass_refraction_00000001", + "generator": "glass_refraction", + "timestamp": "2026-02-17T07:41:22.793613", + "parameters": { + "n_glass": 1.892918, + "n_air": 1.0, + "theta_incident_degrees": 12.223077, + "theta_refracted_degrees": 6.421835, + 
"objects": [ + { + "symbol": "ray", + "start": [ + 411.917268, + 50 + ], + "end": [ + 512, + 512 + ], + "type": "incident", + "angle_degrees": 12.223077 + }, + { + "symbol": "ray", + "start": [ + 512, + 512 + ], + "end": [ + 563.999892, + 974 + ], + "type": "refracted", + "angle_degrees": 6.421835 + } + ] + }, + "param_hash": "50198f643e8f3134", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/prompt.txt b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2478408c903b1d76bf8c478afba5b89e46ea9025 --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000001/prompt.txt @@ -0,0 +1 @@ +A light ray enters glass from air. The glass refractive index is 1.89, and the incident angle is 12.2 degrees. Using Snell's law, predict how the light ray refracts as it enters the glass. Draw the refracted ray from the point where the incident ray hits the glass surface, extending to the image edge. Show the complete refracted ray path inside the glass. 
\ No newline at end of file diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/final_frame.png b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4be20a566286eeaa437e93208edf845ca42ef0a0 Binary files /dev/null and b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/final_frame.png differ diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/first_frame.png b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c50a0f62694880b24543807a7e0b01ea52458045 Binary files /dev/null and b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/first_frame.png differ diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/ground_truth.mp4 b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b2badc72ccbe814f43436b5b864c698c21bc3a36 --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f214675ce5d585e4e8176fda5cc3943136b494365b87d79e6bc9245a45e02179 +size 310584 diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/metadata.json b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b475abd7e91c01871ebacd08a3c0513fa39eff3d --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "glass_refraction_00000002", + "generator": "glass_refraction", + "timestamp": "2026-02-17T07:41:23.428430", + "parameters": { + "n_glass": 1.76491, + "n_air": 1.0, + "theta_incident_degrees": 53.497672, + "theta_refracted_degrees": 27.094054, + 
"objects": [ + { + "symbol": "ray", + "start": [ + 50, + 170.108927 + ], + "end": [ + 512, + 512 + ], + "type": "incident", + "angle_degrees": 53.497672 + }, + { + "symbol": "ray", + "start": [ + 512, + 512 + ], + "end": [ + 748.35685, + 974 + ], + "type": "refracted", + "angle_degrees": 27.094054 + } + ] + }, + "param_hash": "c05f90704a6377c0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/prompt.txt b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f1098275abcac9639a1413036c290f24cb10869 --- /dev/null +++ b/VBVR-Dataset/glass_refraction_task/glass_refraction_00000002/prompt.txt @@ -0,0 +1 @@ +A light ray enters glass from air. The glass refractive index is 1.76, and the incident angle is 53.5 degrees. Using Snell's law, predict how the light ray refracts as it enters the glass. Draw the refracted ray from the point where the incident ray hits the glass surface, extending to the image edge. Show the complete refracted ray path inside the glass. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/final_frame.png b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e8aeb6631fa14b91635e307b16007ba1e3132a20 Binary files /dev/null and b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/first_frame.png b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e36b6f252285b9a7808c8059ac1e9aba728df53c Binary files /dev/null and b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..ba5452b1928e9960693e0e4538ee3e3e07be4943 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb7547a56fb92ce1514a08423440a9e5edaffe336a5bbb5b466dbf67442d09f +size 637543 diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/metadata.json b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe7189bae2ef83c24a36ce872127857575d8142 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/metadata.json @@ -0,0 +1,67 @@ +{ + "task_id": "grid_avoid_obstacles_00000000", + "generator": "grid_avoid_obstacles", + "timestamp": "2026-02-17T06:56:31.037657", + "parameters": { + "start": [ + 3, + 8 + 
], + "end": [ + 1, + 1 + ], + "obstacles": [ + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 1, + 9 + ], + [ + 2, + 5 + ], + [ + 4, + 7 + ], + [ + 4, + 9 + ], + [ + 5, + 2 + ], + [ + 6, + 1 + ], + [ + 6, + 2 + ], + [ + 8, + 9 + ] + ] + }, + "param_hash": "5576639e94646752", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/prompt.txt b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b29aa83c812e61c71bbad69fb5554e16d1bb67b --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a blue start square (containing a yellow circular agent), a red end square, and multiple black X marks indicating obstacles. Starting from the blue start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path without entering any cells marked with black X obstacles. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/final_frame.png b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bbb8c3178644ec831ecd10e66cfb11d3e8123efe Binary files /dev/null and b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/first_frame.png b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..abdf59ace188cb86380c2a150400c5b1d857e64f Binary files /dev/null and b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..8aed4db06147f408e85155745093dee1b0630c95 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb267f7828ed2f2432253191fb4c7340bb8bfdd9b0a94f2989ba43309404b69 +size 652231 diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/metadata.json b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8da7974831b4ef6d17360a87d97e6718d32136e9 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "grid_avoid_obstacles_00000001", + "generator": "grid_avoid_obstacles", + "timestamp": "2026-02-17T06:56:31.830650", + "parameters": { + "start": [ + 3, + 8 + 
], + "end": [ + 9, + 5 + ], + "obstacles": [ + [ + 1, + 2 + ], + [ + 2, + 5 + ], + [ + 3, + 5 + ], + [ + 4, + 0 + ], + [ + 5, + 6 + ], + [ + 5, + 7 + ], + [ + 5, + 8 + ], + [ + 6, + 7 + ], + [ + 7, + 9 + ], + [ + 9, + 7 + ], + [ + 9, + 9 + ] + ] + }, + "param_hash": "fb7886bf36721f71", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/prompt.txt b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b29aa83c812e61c71bbad69fb5554e16d1bb67b --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a blue start square (containing a yellow circular agent), a red end square, and multiple black X marks indicating obstacles. Starting from the blue start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path without entering any cells marked with black X obstacles. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/final_frame.png b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e528102781460b969f2c8c01b584e6f92d752d0b Binary files /dev/null and b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/first_frame.png b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..75f827c0b1357399f82acf534066baabe1235299 Binary files /dev/null and b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..611c505037cb811c639393b7f267365eea3a471a --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f5bc6850102e9c378986a26fd277f4badb15bd1891af50a4b15deb8758cec39 +size 680099 diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/metadata.json b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..cd2624ac16f104d5084425193cd9161b51159d7a --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/metadata.json @@ -0,0 +1,51 @@ +{ + "task_id": "grid_avoid_obstacles_00000002", + "generator": "grid_avoid_obstacles", + "timestamp": "2026-02-17T06:56:32.741950", + "parameters": { + "start": [ + 8, + 5 + 
], + "end": [ + 0, + 8 + ], + "obstacles": [ + [ + 0, + 5 + ], + [ + 1, + 0 + ], + [ + 4, + 7 + ], + [ + 5, + 3 + ], + [ + 6, + 7 + ], + [ + 7, + 3 + ] + ] + }, + "param_hash": "49d8b31c0e64076f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/prompt.txt b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b29aa83c812e61c71bbad69fb5554e16d1bb67b --- /dev/null +++ b/VBVR-Dataset/grid_avoid_obstacles_task/grid_avoid_obstacles_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a blue start square (containing a yellow circular agent), a red end square, and multiple black X marks indicating obstacles. Starting from the blue start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path without entering any cells marked with black X obstacles. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/final_frame.png b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..df2813066bbb70f0de5f89b720664276704820fc Binary files /dev/null and b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/first_frame.png b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..63f38194151fa1687febdcc67cc8a8d4e28f683f Binary files /dev/null and b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..1564659549e5dba6b98840b88cb729c7e157058a --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd483ec527aeddf9de0243ba14e67255dde444a4b3c59fa4eb377652508503b8 +size 547328 diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/metadata.json b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7cdfb127ff16e425cb2f0380fa6dbbc05bb17776 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/metadata.json @@ -0,0 +1,67 @@ +{ + "task_id": "grid_avoid_red_block_00000000", + "generator": "grid_avoid_red_block", + "timestamp": "2026-02-17T07:03:13.443411", + "parameters": { + "start": [ + 3, + 8 + 
], + "end": [ + 1, + 1 + ], + "obstacles": [ + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 1, + 9 + ], + [ + 2, + 5 + ], + [ + 4, + 7 + ], + [ + 4, + 9 + ], + [ + 5, + 2 + ], + [ + 6, + 1 + ], + [ + 6, + 2 + ], + [ + 8, + 9 + ] + ] + }, + "param_hash": "5576639e94646752", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/prompt.txt b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb5dbb7a7676f87ee522a321d7a598b0f86af246 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a blue start square (containing a yellow circular agent), a green end square, and multiple red filled rectangles indicating obstacles. Starting from the blue start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the green end square along the shortest path without entering any cells containing red filled rectangles. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/final_frame.png b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c45411ae085e6b08eceec38ce0cea6d9d9bc1a3e Binary files /dev/null and b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/first_frame.png b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0c71959706ff484f9e88bc0caaa36973ec602090 Binary files /dev/null and b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..fdfbd3e07d158963ef8091bc3bc952f5208b155b --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18aaac5c0886477924b29cc8645534ff619117a63ee4d1a88b8ac8eb62040237 +size 553591 diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/metadata.json b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fd32da050dd99eb7f0ead339333ada79dcb79b4e --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "grid_avoid_red_block_00000001", + "generator": "grid_avoid_red_block", + "timestamp": "2026-02-17T07:03:14.234401", + "parameters": { + "start": [ + 3, + 8 + 
], + "end": [ + 9, + 5 + ], + "obstacles": [ + [ + 1, + 2 + ], + [ + 2, + 5 + ], + [ + 3, + 5 + ], + [ + 4, + 0 + ], + [ + 5, + 6 + ], + [ + 5, + 7 + ], + [ + 5, + 8 + ], + [ + 6, + 7 + ], + [ + 7, + 9 + ], + [ + 9, + 7 + ], + [ + 9, + 9 + ] + ] + }, + "param_hash": "fb7886bf36721f71", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/prompt.txt b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb5dbb7a7676f87ee522a321d7a598b0f86af246 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a blue start square (containing a yellow circular agent), a green end square, and multiple red filled rectangles indicating obstacles. Starting from the blue start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the green end square along the shortest path without entering any cells containing red filled rectangles. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/final_frame.png b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1f4e34e582d3f007d34aa97d3259f95fe86f8df4 Binary files /dev/null and b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/first_frame.png b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..662356f0435fb0062ea600bc165fc5955d310540 Binary files /dev/null and b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a0e2ec2cc1400d63f93e943ba5c5c1ad0dabc8ec --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff04ae9966319d4780a3d203a95c5d54a0b6d1f8a67bc3c4b492b0460c4cc8f +size 626679 diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/metadata.json b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..11114a911cd2d29827cbe70c230278ec60780209 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/metadata.json @@ -0,0 +1,51 @@ +{ + "task_id": "grid_avoid_red_block_00000002", + "generator": "grid_avoid_red_block", + "timestamp": "2026-02-17T07:03:15.130977", + "parameters": { + "start": [ + 8, + 5 + 
], + "end": [ + 0, + 8 + ], + "obstacles": [ + [ + 0, + 5 + ], + [ + 1, + 0 + ], + [ + 4, + 7 + ], + [ + 5, + 3 + ], + [ + 6, + 7 + ], + [ + 7, + 3 + ] + ] + }, + "param_hash": "49d8b31c0e64076f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/prompt.txt b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb5dbb7a7676f87ee522a321d7a598b0f86af246 --- /dev/null +++ b/VBVR-Dataset/grid_avoid_red_block_task/grid_avoid_red_block_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a blue start square (containing a yellow circular agent), a green end square, and multiple red filled rectangles indicating obstacles. Starting from the blue start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the green end square along the shortest path without entering any cells containing red filled rectangles. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/final_frame.png b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e1f60aed4a0d8cccc7512d35fba73a1beff0ef61 Binary files /dev/null and b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/first_frame.png b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f2defa60e923a2aa2426c81c2f4f39e736216d28 Binary files /dev/null and b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d28cf59db5ebf0d80d8ecf214a7565ec3e351377 --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbaa375b6acae8b23e2e98246de082fb6d906220b2e518d37e0fbd5d1f78250c +size 528182 diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/metadata.json b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5ab9628392ebf72141b5f55d8dbcdee7da26c0dc --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/metadata.json @@ -0,0 +1,63 @@ +{ + "task_id": "grid_color_sequence_00000000", + "generator": "grid_color_sequence", + "timestamp": "2026-02-17T06:55:40.569461", + "parameters": { + "start": [ + 3, + 8 + ], + "end": [ + 1, + 1 + 
], + "color_stops": [ + { + "order": 1, + "position": [ + 4, + 7 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "order": 2, + "position": [ + 5, + 2 + ], + "color": [ + 255, + 255, + 0 + ] + }, + { + "order": 3, + "position": [ + 6, + 1 + ], + "color": [ + 255, + 165, + 0 + ] + } + ] + }, + "param_hash": "f3ddefd161c4e678", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/prompt.txt b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc09d39338f47a8530bb579462d159057933a23a --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and colored cells (blue, yellow, and orange). A purple circular agent is positioned at the green start point. The agent can move to adjacent cells (up, down, left, right). Starting from the green start point, the agent must visit the colored cells in order (blue, then yellow, then orange), taking the shortest path between each consecutive pair of colored cells. The agent is allowed to pass through the red end point when visiting the colored cells if needed. After visiting all colored cells in sequence, the agent must reach the red end point, also following the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/final_frame.png b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2c4c413a6bd13096a6d4f4c42e243ab6926c4b2d Binary files /dev/null and b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/first_frame.png b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9c9fc0234d8bdcff1865f52c32c33af922690fa4 Binary files /dev/null and b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..299aa0e08325f16d05e0819372e5773df5c3cc15 --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708b92b0f74734c666488fd0921667bbf4018795d906dba34d742622b4b31fc9 +size 539898 diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/metadata.json b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..009afd4f75fa7b1614b8d7e77734b56e1a6358b9 --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/metadata.json @@ -0,0 +1,63 @@ +{ + "task_id": "grid_color_sequence_00000001", + "generator": "grid_color_sequence", + "timestamp": "2026-02-17T06:55:41.501641", + "parameters": { + "start": [ + 1, + 9 + ], + "end": [ + 8, + 9 + 
], + "color_stops": [ + { + "order": 1, + "position": [ + 4, + 9 + ], + "color": [ + 255, + 165, + 0 + ] + }, + { + "order": 2, + "position": [ + 0, + 2 + ], + "color": [ + 255, + 255, + 0 + ] + }, + { + "order": 3, + "position": [ + 0, + 1 + ], + "color": [ + 0, + 0, + 255 + ] + } + ] + }, + "param_hash": "f31e3ef530ae8d70", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/prompt.txt b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..54f5ca229bc2af7c962a08b3df1e15bbb0ca52c6 --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and colored cells (orange, yellow, and blue). A purple circular agent is positioned at the green start point. The agent can move to adjacent cells (up, down, left, right). Starting from the green start point, the agent must visit the colored cells in order (orange, then yellow, then blue), taking the shortest path between each consecutive pair of colored cells. The agent is allowed to pass through the red end point when visiting the colored cells if needed. After visiting all colored cells in sequence, the agent must reach the red end point, also following the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/final_frame.png b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..83c12c28c80c9408040ba4d7dea3d3fa28dd3693 Binary files /dev/null and b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/first_frame.png b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4ad3444b612c25129f17316b5111f72c2c4049ae Binary files /dev/null and b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..444fc3e4f1323639077371b9f13ecfe635c672b5 --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b4789a540e60cd4af109337731d22385972ef4ee5ea2ed484f2eba03df8d35 +size 519134 diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/metadata.json b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9c2736e305c75cd39662ec37bcb3488da78ae0f0 --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/metadata.json @@ -0,0 +1,63 @@ +{ + "task_id": "grid_color_sequence_00000002", + "generator": "grid_color_sequence", + "timestamp": "2026-02-17T06:55:42.433998", + "parameters": { + "start": [ + 6, + 2 + ], + "end": [ + 0, + 3 + 
], + "color_stops": [ + { + "order": 1, + "position": [ + 6, + 9 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "order": 2, + "position": [ + 7, + 3 + ], + "color": [ + 255, + 255, + 0 + ] + }, + { + "order": 3, + "position": [ + 5, + 1 + ], + "color": [ + 255, + 165, + 0 + ] + } + ] + }, + "param_hash": "daab9f45ae0ba709", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/prompt.txt b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..dc09d39338f47a8530bb579462d159057933a23a --- /dev/null +++ b/VBVR-Dataset/grid_color_sequence_task/grid_color_sequence_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and colored cells (blue, yellow, and orange). A purple circular agent is positioned at the green start point. The agent can move to adjacent cells (up, down, left, right). Starting from the green start point, the agent must visit the colored cells in order (blue, then yellow, then orange), taking the shortest path between each consecutive pair of colored cells. The agent is allowed to pass through the red end point when visiting the colored cells if needed. After visiting all colored cells in sequence, the agent must reach the red end point, also following the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/final_frame.png b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..177685ca1033704cf7417287015c0d95c10bd17d Binary files /dev/null and b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/first_frame.png b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6b67edebf9706b3d4565f684e94d25557a2ff19e Binary files /dev/null and b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2e4094e5c836e78b003de8e39a1b138090c8ab43 --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52923d863afbfc7b0e8c6ce5a18b52a265b1713cba62fee8c322561b55bbaf8a +size 633036 diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/metadata.json b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6c311d506e4b275292cb319832ce6c48e26f2c73 --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/metadata.json @@ -0,0 +1,66 @@ +{ + "task_id": "grid_go_through_block_00000000", + "generator": "grid_go_through_block", + "timestamp": "2026-02-17T07:02:06.667694", + "parameters": 
{ + "start": [ + 3, + 8 + ], + "end": [ + 1, + 1 + ], + "blocks": [ + { + "order": 1, + "position": [ + 4, + 7 + ], + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue" + }, + { + "order": 2, + "position": [ + 5, + 2 + ], + "color": [ + 255, + 255, + 0 + ], + "color_name": "yellow" + }, + { + "order": 3, + "position": [ + 6, + 1 + ], + "color": [ + 255, + 192, + 203 + ], + "color_name": "pink" + } + ] + }, + "param_hash": "e3ef64eccec3f833", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/prompt.txt b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f87c5470ca9af8dd6f45e76c1f9636c0d1781b6 --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start square (containing an orange circular agent), a red end square, and multiple blue, yellow and pink rectangular blocks. Starting from the green start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path that passes through all blue, yellow and pink blocks (the agent must visit every blue, yellow and pink block before reaching the red end square). 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/final_frame.png b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ac97542bb82e1b65ff46c0d4d9eec6f91f301643 Binary files /dev/null and b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/first_frame.png b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a33d40cd6afe94cbaac58e65f34fac56d1bfce6c Binary files /dev/null and b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f8d061a8173b3834ae08759a5b3b071da43cfb1d --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf9613535c7610c3bbe9c807b9d417108ef3b42cf7b8877670597f0b36379116 +size 1125780 diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/metadata.json b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b2643002520a28aaeccd600a9a94aca4d5c7aba3 --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/metadata.json @@ -0,0 +1,66 @@ +{ + "task_id": "grid_go_through_block_00000001", + "generator": "grid_go_through_block", + "timestamp": "2026-02-17T07:02:08.444404", + "parameters": 
{ + "start": [ + 9, + 0 + ], + "end": [ + 2, + 0 + ], + "blocks": [ + { + "order": 1, + "position": [ + 8, + 9 + ], + "color": [ + 128, + 0, + 128 + ], + "color_name": "purple" + }, + { + "order": 2, + "position": [ + 6, + 2 + ], + "color": [ + 128, + 0, + 128 + ], + "color_name": "purple" + }, + { + "order": 3, + "position": [ + 0, + 3 + ], + "color": [ + 255, + 192, + 203 + ], + "color_name": "pink" + } + ] + }, + "param_hash": "1734ee9a08e52d22", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/prompt.txt b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..69369ae969db34d9a004a2c4b4e32a2881371197 --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start square (containing an orange circular agent), a red end square, and multiple purple and pink rectangular blocks. Starting from the green start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path that passes through all purple and pink blocks (the agent must visit every purple and pink block before reaching the red end square). 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/final_frame.png b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d563d3f16c58169e3062a362056470b5e7cdb7e4 Binary files /dev/null and b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/first_frame.png b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..342df03f7972abff567f87f43c90c0f9058c95ee Binary files /dev/null and b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..9df72d6b220865c6df055cf5e05d7b7a394ea6cb --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:290293c3d8cef69e884f0d6f52b07b0bcecbd434ee99b92bdf161cec370d69b5 +size 930393 diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/metadata.json b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..546e84a133c7b626498bbf3b39bca5671be03ffd --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "grid_go_through_block_00000002", + "generator": "grid_go_through_block", + "timestamp": "2026-02-17T07:02:09.846462", + "parameters": 
{ + "start": [ + 5, + 1 + ], + "end": [ + 2, + 7 + ], + "blocks": [ + { + "order": 1, + "position": [ + 5, + 5 + ], + "color": [ + 255, + 192, + 203 + ], + "color_name": "pink" + }, + { + "order": 2, + "position": [ + 8, + 5 + ], + "color": [ + 128, + 0, + 128 + ], + "color_name": "purple" + }, + { + "order": 3, + "position": [ + 5, + 5 + ], + "color": [ + 255, + 192, + 203 + ], + "color_name": "pink" + }, + { + "order": 4, + "position": [ + 0, + 2 + ], + "color": [ + 128, + 0, + 128 + ], + "color_name": "purple" + } + ] + }, + "param_hash": "a6d7939ba8ad2f67", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/prompt.txt b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..69369ae969db34d9a004a2c4b4e32a2881371197 --- /dev/null +++ b/VBVR-Dataset/grid_go_through_block_task/grid_go_through_block_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start square (containing an orange circular agent), a red end square, and multiple purple and pink rectangular blocks. Starting from the green start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path that passes through all purple and pink blocks (the agent must visit every purple and pink block before reaching the red end square). 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/final_frame.png b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ce20f7863397d6cf253daf24d44d0665afe65f60 Binary files /dev/null and b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/first_frame.png b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f7e4644e5795574cdfac48f5e917234bd03b06ee Binary files /dev/null and b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d090d27f6ce8317fd4fa850226bec40e6273400d --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27944674e23fe6b66c8136ee9c1aac39d8dacaf39ab9bf513cb385605143222c +size 805395 diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/metadata.json b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3d85891655247fe980face7670af33187c1d3c18 --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/metadata.json @@ -0,0 +1,105 @@ +{ + "task_id": "grid_highest_cost_00000000", + "generator": "grid_highest_cost", + "timestamp": "2026-02-26T09:53:54.974933", + "parameters": { + "grid": [ + [ + 20, + 50, + 10, + 10 + ], + [ + 50, + 30, + 30, + 40 + ], + [ + 30, + 20, + 40, + 
10 + ], + [ + 10, + 50, + 50, + 50 + ] + ], + "path": [ + [ + 0, + 0 + ], + [ + 1, + 0 + ], + [ + 2, + 0 + ], + [ + 3, + 0 + ], + [ + 3, + 1 + ], + [ + 2, + 1 + ], + [ + 1, + 1 + ], + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 1, + 2 + ], + [ + 1, + 3 + ], + [ + 2, + 3 + ], + [ + 2, + 2 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ] + ] + }, + "param_hash": "3a9953725c3d70d2", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/prompt.txt b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..7639d04abdad3e84cdb5aac79636b1006424c781 --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 4x4 grid with cost values displayed in each cell, a green start cell (containing a yellow Pac-Man agent) at the top-left, and a red goal cell at the bottom-right. Starting from the green start cell, the agent can move to adjacent cells (up, down, left, right) one step at a time. Move the agent to the red goal cell along the path with the highest total cost (the sum of all cost values of cells visited along the path), showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/final_frame.png b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..60fc3af34ea31995b806ea091101ef8d5b381d02 Binary files /dev/null and b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/first_frame.png b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7b115b45adae1da2e482b380465c18b3539edadc Binary files /dev/null and b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4f87d537ba4bfb089d0124f1dba3b65aaa0ef20d --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b27b8bb1c87d65d68e8c543fdd2b480cf36f42b6cd4123f575b856db28dc48e +size 805275 diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/metadata.json b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bc31ffda3f88fca11a07fac3064c5b2bfc8cb09d --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/metadata.json @@ -0,0 +1,105 @@ +{ + "task_id": "grid_highest_cost_00000001", + "generator": "grid_highest_cost", + "timestamp": "2026-02-26T09:53:55.667736", + "parameters": { + "grid": [ + [ + 20, + 30, + 30, + 50 + ], + [ + 10, + 20, + 10, + 10 + ], + [ + 40, + 20, + 10, + 
20 + ], + [ + 50, + 50, + 30, + 40 + ] + ], + "path": [ + [ + 0, + 0 + ], + [ + 1, + 0 + ], + [ + 2, + 0 + ], + [ + 3, + 0 + ], + [ + 3, + 1 + ], + [ + 2, + 1 + ], + [ + 1, + 1 + ], + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 0, + 3 + ], + [ + 1, + 3 + ], + [ + 2, + 3 + ], + [ + 2, + 2 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ] + ] + }, + "param_hash": "f940d337de0c4e67", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/prompt.txt b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..7639d04abdad3e84cdb5aac79636b1006424c781 --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 4x4 grid with cost values displayed in each cell, a green start cell (containing a yellow Pac-Man agent) at the top-left, and a red goal cell at the bottom-right. Starting from the green start cell, the agent can move to adjacent cells (up, down, left, right) one step at a time. Move the agent to the red goal cell along the path with the highest total cost (the sum of all cost values of cells visited along the path), showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/final_frame.png b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9f2a2b532d60a060780b241aa70a78b72f8c23fc Binary files /dev/null and b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/first_frame.png b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d8c31fba0db1dca0d778389fcdfcf63cc884de86 Binary files /dev/null and b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..84929e08f7831e795a6f5f560474afd64b49ba6e --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5ffabbb9679b44bff70914e48aa332803c493a0933916b5069ab0df2f74fa3 +size 812629 diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/metadata.json b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8680769c98d38f74b6304866c96e86806bde64ea --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/metadata.json @@ -0,0 +1,105 @@ +{ + "task_id": "grid_highest_cost_00000002", + "generator": "grid_highest_cost", + "timestamp": "2026-02-26T09:53:56.354629", + "parameters": { + "grid": [ + [ + 50, + 40, + 20, + 30 + ], + [ + 10, + 20, + 40, + 50 + ], + [ + 30, + 10, + 20, + 
30 + ], + [ + 30, + 50, + 30, + 40 + ] + ], + "path": [ + [ + 0, + 0 + ], + [ + 1, + 0 + ], + [ + 2, + 0 + ], + [ + 3, + 0 + ], + [ + 3, + 1 + ], + [ + 3, + 2 + ], + [ + 2, + 2 + ], + [ + 1, + 2 + ], + [ + 1, + 1 + ], + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 0, + 3 + ], + [ + 1, + 3 + ], + [ + 2, + 3 + ], + [ + 3, + 3 + ] + ] + }, + "param_hash": "d8664e256ad3d8b7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/prompt.txt b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..7639d04abdad3e84cdb5aac79636b1006424c781 --- /dev/null +++ b/VBVR-Dataset/grid_highest_cost_task/grid_highest_cost_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 4x4 grid with cost values displayed in each cell, a green start cell (containing a yellow Pac-Man agent) at the top-left, and a red goal cell at the bottom-right. Starting from the green start cell, the agent can move to adjacent cells (up, down, left, right) one step at a time. Move the agent to the red goal cell along the path with the highest total cost (the sum of all cost values of cells visited along the path), showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/._first_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/._first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e9684277dd5053c485623729eaaa6661c501aada Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/._first_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/._ground_truth.mp4 b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/._ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0b31d68e9339857972ed69a8da6fbb794b85682f Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/._ground_truth.mp4 differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/final_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b5f089f7007a22af027a73d1d579c3ce43a6ef87 Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/first_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..803320c0cf0d58056c2f2bf0416c1a0ad2263c12 Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..cbd54b750a536cd4d183e14f254d2e0bf05d9697 --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a726933364b19d65a70ad06363a1fee7331d963692f7d8c1fa9c9031d3c89d42 +size 554484 diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/metadata.json b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6f982e246ae8a95d0303e647480bd96bd7d8d14c --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/metadata.json @@ -0,0 +1,48 @@ +{ + "task_id": "grid_number_sequence_00000000", + "generator": "grid_number_sequence", + "timestamp": "2026-02-26T07:28:36.191681", + "parameters": { + "start": [ + 3, + 8 + ], + "end": [ + 1, + 1 + ], + "number_positions": [ + { + "number": 1, + "position": [ + 8, + 5 + ] + }, + { + "number": 2, + "position": [ + 4, + 7 + ] + }, + { + "number": 3, + "position": [ + 5, + 2 + ] + } + ] + }, + "param_hash": "c69950f62a0c5b5b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/prompt.txt b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7cacbd86285ff0f522c4a1f4bec8c28c58d12ef --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and yellow cells marked with numbers 1, 2, and 3. An orange circular agent is positioned at the green start point. The agent can move to adjacent cells (up, down, left, right). 
Starting from the green start point, the agent must visit the numbered yellow cells in numerical order (1, then 2, then 3), taking the shortest path between each consecutive pair of numbered cells. The agent is allowed to pass through the red end point when visiting the numbered cells if needed. After visiting all numbered cells in sequence, the agent must reach the red end point, also following the shortest path. \ No newline at end of file diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/final_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f2f1e8eef66c57ffa67f4c05cfbcac7f6f6d7954 Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/first_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f6346482acd3d18cdb2943ccc17d081fe5fa6777 Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..44ad95b40fc551c1fe837148ddef1651d2da37fe --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ef351311b04298e10298ad3dbc51c8908a7312616b26b363c526085e6c8c69 +size 567936 diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/metadata.json 
b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1a7d0589f1f2ea8eb8c45804c16de89e4f32f8fa --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/metadata.json @@ -0,0 +1,48 @@ +{ + "task_id": "grid_number_sequence_00000001", + "generator": "grid_number_sequence", + "timestamp": "2026-02-26T07:28:37.172767", + "parameters": { + "start": [ + 6, + 1 + ], + "end": [ + 1, + 9 + ], + "number_positions": [ + { + "number": 1, + "position": [ + 8, + 9 + ] + }, + { + "number": 2, + "position": [ + 2, + 5 + ] + }, + { + "number": 3, + "position": [ + 4, + 9 + ] + } + ] + }, + "param_hash": "635561f8c5c80369", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/prompt.txt b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7cacbd86285ff0f522c4a1f4bec8c28c58d12ef --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and yellow cells marked with numbers 1, 2, and 3. An orange circular agent is positioned at the green start point. The agent can move to adjacent cells (up, down, left, right). Starting from the green start point, the agent must visit the numbered yellow cells in numerical order (1, then 2, then 3), taking the shortest path between each consecutive pair of numbered cells. The agent is allowed to pass through the red end point when visiting the numbered cells if needed. After visiting all numbered cells in sequence, the agent must reach the red end point, also following the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/final_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9e98edc08f7c977aa0aa39cc55e38ee087412d2c Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/first_frame.png b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1e24c4a9c0f71d4f849f806cee5383f1c6f8242b Binary files /dev/null and b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3a40b5942e996f64052220fe97ad560c7925e3f1 --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd44f2aa9861ddc2a72e7a0dc093168d1976f45a25ef3cefa9f9f1b491558c9f +size 752017 diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/metadata.json b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..eda84da0bdac1f50ec5fe5cb6a42fab20d88dd7d --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/metadata.json @@ -0,0 +1,48 @@ +{ + "task_id": "grid_number_sequence_00000002", + "generator": "grid_number_sequence", + "timestamp": "2026-02-26T07:28:38.578990", + "parameters": { + "start": [ + 0, + 2 + 
], + "end": [ + 0, + 1 + ], + "number_positions": [ + { + "number": 1, + "position": [ + 6, + 2 + ] + }, + { + "number": 2, + "position": [ + 0, + 3 + ] + }, + { + "number": 3, + "position": [ + 8, + 9 + ] + } + ] + }, + "param_hash": "a165971d5092ef99", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/prompt.txt b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7cacbd86285ff0f522c4a1f4bec8c28c58d12ef --- /dev/null +++ b/VBVR-Dataset/grid_number_sequence_task/grid_number_sequence_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and yellow cells marked with numbers 1, 2, and 3. An orange circular agent is positioned at the green start point. The agent can move to adjacent cells (up, down, left, right). Starting from the green start point, the agent must visit the numbered yellow cells in numerical order (1, then 2, then 3), taking the shortest path between each consecutive pair of numbered cells. The agent is allowed to pass through the red end point when visiting the numbered cells if needed. After visiting all numbered cells in sequence, the agent must reach the red end point, also following the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/final_frame.png b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e880d79dcdf08ce3168a9c5e888cea2bc0829e6f Binary files /dev/null and b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/first_frame.png b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4cfdd1fe3bfafb98d425a120ad557660204847c9 Binary files /dev/null and b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c5d3ddd26418a344696b7135c23ac99d2943b91e --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffd7d51d88d3de04cb85fc4a1e36efa0dbdafd8d6142e296987fceec69696e14 +size 628137 diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/metadata.json b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..28cd96c8651e15264d16043531273f91d5843168 --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/metadata.json @@ -0,0 +1,82 @@ +{ + "task_id": "grid_obtaining_award_00000000", + "generator": "grid_obtaining_award", + "timestamp": "2026-02-17T06:47:58.958956", + "parameters": { + "start": [ + 3, + 8 + 
], + "end": [ + 1, + 1 + ], + "rewards": [ + { + "id": 0, + "position": [ + 6, + 1 + ], + "color": [ + 150, + 255, + 200 + ] + }, + { + "id": 1, + "position": [ + 1, + 9 + ], + "color": [ + 100, + 200, + 255 + ] + }, + { + "id": 2, + "position": [ + 4, + 7 + ], + "color": [ + 200, + 255, + 255 + ] + }, + { + "id": 3, + "position": [ + 5, + 2 + ], + "color": [ + 255, + 100, + 100 + ] + } + ], + "shape": "circle", + "reward_order": [ + 1, + 2, + 3, + 0 + ] + }, + "param_hash": "65ba1254ad124ba6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/prompt.txt b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2075493726d28e9d4a0066a38c9780d8ddfc6044 --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and 4 circle reward items scattered across it. A circular agent starts at the green start point and can move to adjacent cells (up, down, left, right). The agent collects a reward by moving to its cell, and once collected, the reward disappears. Find the shortest path that collects all 4 circle rewards before reaching the red end point. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/final_frame.png b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1491cf2d84d83a1b6d146e4ab6514402dfb0c7e2 Binary files /dev/null and b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/first_frame.png b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2e4397c28e3653f2eaa7027def3bfb8e2f797a46 Binary files /dev/null and b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..9c27cad49bac2abe5d8c077b8abe46621a7546a1 --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b6ca16e5f45bd161609cf89f2182241dedf35de0fa8f38d8cc52288cecd61d +size 542645 diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/metadata.json b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f786e1cf3113ebfa5150695932d7cd61be89ba5b --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/metadata.json @@ -0,0 +1,69 @@ +{ + "task_id": "grid_obtaining_award_00000001", + "generator": "grid_obtaining_award", + "timestamp": "2026-02-17T06:48:00.135982", + "parameters": { + "start": [ + 2, + 0 + 
], + "end": [ + 1, + 6 + ], + "rewards": [ + { + "id": 0, + "position": [ + 8, + 9 + ], + "color": [ + 200, + 150, + 255 + ] + }, + { + "id": 1, + "position": [ + 0, + 3 + ], + "color": [ + 180, + 255, + 100 + ] + }, + { + "id": 2, + "position": [ + 5, + 6 + ], + "color": [ + 200, + 255, + 150 + ] + } + ], + "shape": "star", + "reward_order": [ + 1, + 2, + 0 + ] + }, + "param_hash": "00be1c0ae85df61d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/prompt.txt b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..129520adb4a0b2aeb8007e71dd125e8a8a9adc86 --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and 3 star reward items scattered across it. A circular agent starts at the green start point and can move to adjacent cells (up, down, left, right). The agent collects a reward by moving to its cell, and once collected, the reward disappears. Find the shortest path that collects all 3 star rewards before reaching the red end point. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/final_frame.png b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7351ae5df0dc0a2c5d6231f0e8dafcb055a11cc5 Binary files /dev/null and b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/first_frame.png b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..13ef39bc1f6b9f26393c9df7c40905e35445d183 Binary files /dev/null and b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a566f064ec763880f283b4fd6ec0a51ada13f0c6 --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961d19a0074c3ae1139e444ba88933c1a521e02a72a03f2ef6508889e20eb211 +size 545177 diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/metadata.json b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..c0549d36d482504fe85b7089f264bfe044b1b03c --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/metadata.json @@ -0,0 +1,82 @@ +{ + "task_id": "grid_obtaining_award_00000002", + "generator": "grid_obtaining_award", + "timestamp": "2026-02-17T06:48:01.251559", + "parameters": { + "start": [ + 1, + 2 + 
], + "end": [ + 7, + 9 + ], + "rewards": [ + { + "id": 0, + "position": [ + 0, + 2 + ], + "color": [ + 255, + 255, + 200 + ] + }, + { + "id": 1, + "position": [ + 5, + 5 + ], + "color": [ + 200, + 255, + 255 + ] + }, + { + "id": 2, + "position": [ + 8, + 5 + ], + "color": [ + 180, + 100, + 255 + ] + }, + { + "id": 3, + "position": [ + 6, + 5 + ], + "color": [ + 180, + 180, + 255 + ] + } + ], + "shape": "star", + "reward_order": [ + 0, + 1, + 3, + 2 + ] + }, + "param_hash": "c27dd37beebbdf71", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/prompt.txt b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..42d55f2d70709efc3fe14b6c3fdd6926b36dd359 --- /dev/null +++ b/VBVR-Dataset/grid_obtaining_award_task/grid_obtaining_award_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start point, a red end point, and 4 star reward items scattered across it. A circular agent starts at the green start point and can move to adjacent cells (up, down, left, right). The agent collects a reward by moving to its cell, and once collected, the reward disappears. Find the shortest path that collects all 4 star rewards before reaching the red end point. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000000/final_frame.png b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9ad04918f6efa4138779b19a74a85c9890f0fafa Binary files /dev/null and b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000000/first_frame.png b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9e67d879afc2fe5c53a1a303a9cccebb1de8dbbd Binary files /dev/null and b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..07fc4dacaa956ba9cf811463147eb4b636b0d14b --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88b4c86662abfa9e8b6946151c8002663dc6856c9ed4e5eb956d46e9b46e034 +size 837411 diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000000/metadata.json b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8cc117fdacce6bd1d088c4e01d1cc357fd64d0d9 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/metadata.json @@ -0,0 +1,182 @@ +{ + "task_id": "grid_shift_00000000", + "generator": "grid_shift", + "timestamp": "2026-02-17T07:49:47.800752", + "parameters": { + "grid_size": 7, + "direction": "up", + "steps": 3, + "color": [ + 0, + 123, + 255 + ], + "color_name": "blue", + "initial_positions": [ + [ + 5, + 3 + ], + [ + 5, + 6 + ], + [ + 6, + 4 + ], + [ + 4, + 3 + ], + [ + 4, + 2 + ], + [ + 5, + 0 + ], + [ + 4, + 4 + ], + [ + 3, + 5 + ], + 
[ + 4, + 5 + ], + [ + 3, + 3 + ], + [ + 5, + 4 + ], + [ + 5, + 2 + ], + [ + 3, + 4 + ], + [ + 6, + 5 + ], + [ + 5, + 1 + ], + [ + 6, + 2 + ], + [ + 3, + 0 + ], + [ + 3, + 2 + ], + [ + 6, + 0 + ] + ], + "final_positions": [ + [ + 2, + 3 + ], + [ + 2, + 6 + ], + [ + 3, + 4 + ], + [ + 1, + 3 + ], + [ + 1, + 2 + ], + [ + 2, + 0 + ], + [ + 1, + 4 + ], + [ + 0, + 5 + ], + [ + 1, + 5 + ], + [ + 0, + 3 + ], + [ + 2, + 4 + ], + [ + 2, + 2 + ], + [ + 0, + 4 + ], + [ + 3, + 5 + ], + [ + 2, + 1 + ], + [ + 3, + 2 + ], + [ + 0, + 0 + ], + [ + 0, + 2 + ], + [ + 3, + 0 + ] + ] + }, + "param_hash": "30cd8319b3ad913c", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000000/prompt.txt b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7e863067e4d3e65a10f9cd0d0939440351b0b08 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 7x7 grid with 19 blue square blocks, each with a black outline, positioned at various locations. All blocks must move simultaneously upward by exactly 3 steps. Each block shifts one grid cell per step toward the top, and all blocks must remain within the grid boundaries throughout the movement. After the movement, all blocks should be positioned exactly 3 steps upward from their original positions. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000001/final_frame.png b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ff8e7a69eada0aa6913037468fa6ed0dd8ab4d5a Binary files /dev/null and b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000001/first_frame.png b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..efe7942c3174acc64263716ed86b3bf222297c69 Binary files /dev/null and b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c5a6dfd05ebbf836486e9a94240cbb9fbdb945c3 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddaea455f26c2801d51cde78a9ad8c96e2fc919e02907cc2e931bb6f1a6dad7 +size 411671 diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000001/metadata.json b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b27ec3eb3917f777c8ea360570998bec9b13648e --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/metadata.json @@ -0,0 +1,118 @@ +{ + "task_id": "grid_shift_00000001", + "generator": "grid_shift", + "timestamp": "2026-02-17T07:49:48.185526", + "parameters": { + "grid_size": 10, + "direction": "up", + "steps": 3, + "color": [ + 255, + 0, + 255 + ], + "color_name": "magenta", + "initial_positions": [ + [ + 7, + 2 + ], + [ + 8, + 1 + ], + [ + 8, + 9 + ], + [ + 5, + 6 + ], + [ + 7, + 4 + ], + [ + 3, + 9 + ], + [ + 4, + 8 + ], + [ + 6, + 0 + 
], + [ + 6, + 9 + ], + [ + 4, + 6 + ], + [ + 8, + 4 + ] + ], + "final_positions": [ + [ + 4, + 2 + ], + [ + 5, + 1 + ], + [ + 5, + 9 + ], + [ + 2, + 6 + ], + [ + 4, + 4 + ], + [ + 0, + 9 + ], + [ + 1, + 8 + ], + [ + 3, + 0 + ], + [ + 3, + 9 + ], + [ + 1, + 6 + ], + [ + 5, + 4 + ] + ] + }, + "param_hash": "70362b79fc7a868a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000001/prompt.txt b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4463ac476fced36c9f1f23a30dcb527af92c3d54 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000001/prompt.txt @@ -0,0 +1 @@ +In the scene, there is a 10x10 grid with 11 magenta square blocks, each outlined in black, placed at different positions. Translate all blocks upward by exactly 3 steps, moving simultaneously and uniformly. Each block shifts 3 cells toward the top direction, and all blocks must remain completely within the grid boundaries. The goal is to achieve a configuration where every block has been moved exactly 3 steps upward to reach its final position. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000002/final_frame.png b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3a7d639c1cbf337ccc36eb6fb881bbc4754e72e1 Binary files /dev/null and b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000002/first_frame.png b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9b7a1a63f260219010b88c7b8962b894cd2e5332 Binary files /dev/null and b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c4883bb85d6e194b103cdcb5669b314201f87a14 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068eb8a2cdc208680c00b5486e2c7e027eaaac6b1d1f61f87f6a5f20a9611d47 +size 167471 diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000002/metadata.json b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..478789428195a5a5a19343e96f937dcaeb311a51 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/metadata.json @@ -0,0 +1,54 @@ +{ + "task_id": "grid_shift_00000002", + "generator": "grid_shift", + "timestamp": "2026-02-17T07:49:48.569646", + "parameters": { + "grid_size": 4, + "direction": "left", + "steps": 2, + "color": [ + 128, + 128, + 128 + ], + "color_name": "gray", + "initial_positions": [ + [ + 3, + 2 + ], + [ + 2, + 3 + ], + [ + 3, + 3 + ] + ], + "final_positions": [ + [ + 3, + 0 + ], + [ + 2, + 1 + ], + [ + 3, + 1 + ] + ] + }, 
+ "param_hash": "bdc38cf41ef2025b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_shift_task/grid_shift_00000002/prompt.txt b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4455b249accea06e1c334efb6762933809be7603 --- /dev/null +++ b/VBVR-Dataset/grid_shift_task/grid_shift_00000002/prompt.txt @@ -0,0 +1 @@ +The scene displays a 4x4 grid containing 3 gray square blocks with black borders, distributed across different cells. Move every block leftward by precisely 2 steps. All blocks move together at the same time, shifting 2 grid cells in the left direction, and each block must stay within the grid's boundaries. The final configuration shows all blocks in their new positions, each exactly 2 steps leftward from where it started. \ No newline at end of file diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/final_frame.png b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..06f1e094ef10a979d2dcb82ef83ebac7e459bbb4 Binary files /dev/null and b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/final_frame.png differ diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/first_frame.png b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7cfbcceadfb0dc26ef74aa3f380fcdfb25820876 Binary files /dev/null and b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/first_frame.png differ diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/ground_truth.mp4 b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/ground_truth.mp4 new file mode 100644 
index 0000000000000000000000000000000000000000..2f763486f83591570dec69ace2ee2ddf5075dfff --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7d26beb1dd49c808df9f7eaed7f49357cc90cd2cd0adfb13b9012d304c4d10 +size 563907 diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/metadata.json b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..73391c9cdf50bca4b3ec519ec1c106ac39ca9d7c --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/metadata.json @@ -0,0 +1,28 @@ +{ + "task_id": "grid_shortest_path_00000000", + "generator": "grid_shortest_path", + "timestamp": "2026-02-17T07:04:14.660104", + "parameters": { + "start": [ + 3, + 8 + ], + "end": [ + 1, + 1 + ], + "start_color": "#800080", + "end_color": "#FFFF00", + "agent_color": "#0000FF" + }, + "param_hash": "f258358791cfac6e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/prompt.txt b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..73ab69d56f4c1f98cf43444bdeb965eaab8b099c --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a purple start square (containing a blue circular agent) and a yellow end square. Starting from the purple start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the yellow end square along the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/final_frame.png b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3893ca4d1fab3d0445187f42fab8774f045c8526 Binary files /dev/null and b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/final_frame.png differ diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/first_frame.png b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..96be021a42c4e2172e5f2a714529bde183213175 Binary files /dev/null and b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/first_frame.png differ diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/ground_truth.mp4 b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3c4796ff85bb00b7ee04045dc86f5a7478a066a9 --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38bb0cdbe91f4e2c71f4f66a27fd0005d0c9dd3fd437a2650a617eb70c78213 +size 442722 diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/metadata.json b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6d84013135841222061703fabdf4f01a824aeb9f --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/metadata.json @@ -0,0 +1,28 @@ +{ + "task_id": "grid_shortest_path_00000001", + "generator": "grid_shortest_path", + "timestamp": "2026-02-17T07:04:15.267496", + "parameters": { + "start": [ + 7, + 5 + ], + "end": [ + 2, + 6 + ], + "start_color": 
"#FF0000", + "end_color": "#800080", + "agent_color": "#00FF00" + }, + "param_hash": "f5c433d7c373bf13", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/prompt.txt b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fcf06faa1a110e70f67a1541cb9f7b129f5a2ab5 --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a red start square (containing a green circular agent) and a purple end square. Starting from the red start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the purple end square along the shortest path. \ No newline at end of file diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/final_frame.png b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5a678cd4d0dbfb7085e6f45228bff95e8e99bf36 Binary files /dev/null and b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/final_frame.png differ diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/first_frame.png b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2d9b0cc676838dd26f2f83b3308c126df2922db3 Binary files /dev/null and b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/first_frame.png differ diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/ground_truth.mp4 b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..ee7cd5d69f501f6ae98b02c0c36e3110532e6e8d --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e82c5df94580bc80461083bf8a2d2646e3460774f6cc87e0bbdbd1f748b8105 +size 475197 diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/metadata.json b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..133684548a7ed7deaa5a6ae5ca0d951324c3f7d2 --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/metadata.json @@ -0,0 +1,28 @@ +{ + "task_id": "grid_shortest_path_00000002", + "generator": "grid_shortest_path", + "timestamp": "2026-02-17T07:04:15.984491", + "parameters": { + "start": [ + 5, + 4 + ], + "end": [ + 9, + 0 + ], + "start_color": "#00FF00", + "end_color": "#FF0000", + "agent_color": "#0000FF" + }, + "param_hash": "f9ef56ed6c63cbaf", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/prompt.txt b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..21449c4787cb51050cfa106da75846b8fd5075ef --- /dev/null +++ b/VBVR-Dataset/grid_shortest_path_task/grid_shortest_path_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a 10x10 grid with a green start square (containing a blue circular agent) and a red end square. Starting from the green start square, the agent can move to adjacent cells (up, down, left, right). The goal is to move the agent to the red end square along the shortest path. 
\ No newline at end of file diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/final_frame.png b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5edea48bf4b4c048ca37a2e3663ddfb78249461b Binary files /dev/null and b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/final_frame.png differ diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/first_frame.png b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5edea48bf4b4c048ca37a2e3663ddfb78249461b Binary files /dev/null and b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/first_frame.png differ diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/ground_truth.mp4 b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b15a79b915234638f937a2b8288a152eb89f783a --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92584db931910f0c8a8e2f2fe78fe69274671d614d4e7309af31bb460414c439 +size 225360 diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/metadata.json b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f0d05703fa9004f197969a05a39be02c6b70c8b7 --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/metadata.json @@ -0,0 +1,25 @@ +{ + "task_id": 
"handle_object_reappearance_00000000", + "generator": "handle_object_reappearance", + "timestamp": "2026-02-17T06:47:26.079213", + "parameters": { + "direction": "up", + "shape": "triangle", + "size": 180, + "color": [ + 177, + 64, + 58 + ] + }, + "param_hash": "f859a3e4c15a8148", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/prompt.txt b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3548b484105ddde0774f09e1495c89d333ded786 --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000000/prompt.txt @@ -0,0 +1 @@ +There is an object in the center. Move the object up off-screen, then return along the same path to the center. \ No newline at end of file diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/final_frame.png b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b0e09538ceda163c0df66171d7f4ca8598202ba9 Binary files /dev/null and b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/final_frame.png differ diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/first_frame.png b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b0e09538ceda163c0df66171d7f4ca8598202ba9 Binary files /dev/null and b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/first_frame.png differ diff --git 
a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/ground_truth.mp4 b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cedae8ae43e19a1606c0dbcb1e56932727f7c885 --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3524c714e90b7e440d513662b7d2ea9575d7e2c51898e5a97b2700c347e764c3 +size 170308 diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/metadata.json b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf89eed1107c7a8da4b25f7b048eaea7b2b6414 --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/metadata.json @@ -0,0 +1,25 @@ +{ + "task_id": "handle_object_reappearance_00000001", + "generator": "handle_object_reappearance", + "timestamp": "2026-02-17T06:47:26.975441", + "parameters": { + "direction": "left", + "shape": "diamond", + "size": 137, + "color": [ + 130, + 83, + 140 + ] + }, + "param_hash": "a842aa02fffa7b7d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/prompt.txt b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fb6425428230ac5a45b8dc0c4d85cfb75425c28f --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000001/prompt.txt @@ -0,0 +1 @@ +There is an object in the center. 
Move the object left off-screen, then return along the same path to the center. \ No newline at end of file diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/final_frame.png b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6ccc56823fa580a60f495e7227c91213258bd24d Binary files /dev/null and b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/final_frame.png differ diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/first_frame.png b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6ccc56823fa580a60f495e7227c91213258bd24d Binary files /dev/null and b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/first_frame.png differ diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/ground_truth.mp4 b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b14fe1860cbe61f6f0fdd4c685b40de4046c765b --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c2f25cf44a7e931a3c7124331ef215b9c163de68a7c31d292aeed7f4badd1f +size 139303 diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/metadata.json b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..12d51d1a55480999198f536bedb2788c26422a42 --- /dev/null +++ 
b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/metadata.json @@ -0,0 +1,25 @@ +{ + "task_id": "handle_object_reappearance_00000002", + "generator": "handle_object_reappearance", + "timestamp": "2026-02-17T06:47:27.844501", + "parameters": { + "direction": "right", + "shape": "square", + "size": 160, + "color": [ + 200, + 168, + 197 + ] + }, + "param_hash": "e71a72c65a0d1a8f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/prompt.txt b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a3c08960fab9ab91d541206ca0a4b92fcc5eff60 --- /dev/null +++ b/VBVR-Dataset/handle_object_reappearance_task/handle_object_reappearance_00000002/prompt.txt @@ -0,0 +1 @@ +There is an object in the center. Move the object right off-screen, then return along the same path to the center. 
\ No newline at end of file diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/final_frame.png b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..897dbb02bc93090ad78ba03320741772399a6cf3 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/final_frame.png differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/first_frame.png b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..74fb4d3d20582c2c2ce3b03fcb4f2a3ab678aeb6 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/first_frame.png differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/ground_truth.mp4 b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..dc897f506eb6f7d5d5f7dafac2ed3995bfa12e57 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/metadata.json b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..34b5418b19ed9dd57dca4c1fe6bd046f592a974a --- /dev/null +++ b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/metadata.json @@ -0,0 +1,75 @@ +{ + "task_id": "highlight_horizontal_lines_00000000", + "generator": "highlight_horizontal_lines", + "timestamp": "2026-02-17T07:00:04.864212", + "parameters": { + 
"lines": [ + { + "x": 713, + "y": 875, + "length": 141, + "thickness": 12, + "is_horizontal": true + }, + { + "x": 506, + "y": 413, + "length": 315, + "thickness": 8, + "is_horizontal": false + }, + { + "x": 704, + "y": 170, + "length": 223, + "thickness": 5, + "is_horizontal": true + }, + { + "x": 672, + "y": 55, + "length": 203, + "thickness": 8, + "is_horizontal": true + }, + { + "x": 600, + "y": 714, + "length": 135, + "thickness": 7, + "is_horizontal": true + }, + { + "x": 261, + "y": 408, + "length": 226, + "thickness": 11, + "is_horizontal": false + }, + { + "x": 407, + "y": 71, + "length": 211, + "thickness": 12, + "is_horizontal": false + }, + { + "x": 74, + "y": 912, + "length": 363, + "thickness": 5, + "is_horizontal": true + } + ] + }, + "param_hash": "a8f5d8c7a47eea46", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/prompt.txt b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c75696cf4915ac1f2125c0d14c3e1a7234ca4a59 --- /dev/null +++ b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000000/prompt.txt @@ -0,0 +1,3 @@ +The image contains several straight lines, including horizontal and vertical lines. +Circle every horizontal line. +Do not circle any vertical line. 
\ No newline at end of file diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/final_frame.png b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8ccedcacca82f5db0feabc67b2bec1679f4be783 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/final_frame.png differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/first_frame.png b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5c0f6551dc4a12b5bd286f14c20b15f2046e58eb Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/first_frame.png differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/ground_truth.mp4 b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a572ea400e06f7b367ad0b53c9c4fa0bdb2d597a Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/metadata.json b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..db8f0cf8af044912b3c954f504cf6f3e442a1c14 --- /dev/null +++ b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/metadata.json @@ -0,0 +1,103 @@ +{ + "task_id": "highlight_horizontal_lines_00000001", + "generator": "highlight_horizontal_lines", + "timestamp": "2026-02-17T07:00:07.271548", + "parameters": { + 
"lines": [ + { + "x": 400, + "y": 273, + "length": 201, + "thickness": 11, + "is_horizontal": true + }, + { + "x": 55, + "y": 625, + "length": 321, + "thickness": 11, + "is_horizontal": false + }, + { + "x": 918, + "y": 627, + "length": 199, + "thickness": 11, + "is_horizontal": false + }, + { + "x": 496, + "y": 563, + "length": 197, + "thickness": 7, + "is_horizontal": false + }, + { + "x": 228, + "y": 405, + "length": 162, + "thickness": 10, + "is_horizontal": true + }, + { + "x": 619, + "y": 472, + "length": 334, + "thickness": 8, + "is_horizontal": false + }, + { + "x": 777, + "y": 521, + "length": 320, + "thickness": 8, + "is_horizontal": false + }, + { + "x": 832, + "y": 170, + "length": 149, + "thickness": 10, + "is_horizontal": false + }, + { + "x": 629, + "y": 967, + "length": 287, + "thickness": 10, + "is_horizontal": true + }, + { + "x": 97, + "y": 231, + "length": 123, + "thickness": 9, + "is_horizontal": false + }, + { + "x": 311, + "y": 94, + "length": 318, + "thickness": 8, + "is_horizontal": true + }, + { + "x": 350, + "y": 644, + "length": 326, + "thickness": 5, + "is_horizontal": false + } + ] + }, + "param_hash": "0a1396d408a5281e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/prompt.txt b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c75696cf4915ac1f2125c0d14c3e1a7234ca4a59 --- /dev/null +++ b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000001/prompt.txt @@ -0,0 +1,3 @@ +The image contains several straight lines, including horizontal and vertical lines. +Circle every horizontal line. +Do not circle any vertical line. 
\ No newline at end of file diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/final_frame.png b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..33b6b2dbfed6190278fe1e6fc0ea4079c2508565 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/final_frame.png differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/first_frame.png b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e6ae837db7254fea27c1ae590e2b8931ec73bee3 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/first_frame.png differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/ground_truth.mp4 b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c27f587dfbfbea553ea04c212195da1a2f9bf595 Binary files /dev/null and b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/metadata.json b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6f0836e2972dbc291aeb766045e71208b94590 --- /dev/null +++ b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/metadata.json @@ -0,0 +1,96 @@ +{ + "task_id": "highlight_horizontal_lines_00000002", + "generator": "highlight_horizontal_lines", + "timestamp": "2026-02-17T07:00:09.740874", + "parameters": { + 
"lines": [ + { + "x": 616, + "y": 395, + "length": 309, + "thickness": 6, + "is_horizontal": true + }, + { + "x": 627, + "y": 857, + "length": 172, + "thickness": 6, + "is_horizontal": true + }, + { + "x": 62, + "y": 549, + "length": 256, + "thickness": 5, + "is_horizontal": false + }, + { + "x": 202, + "y": 762, + "length": 169, + "thickness": 9, + "is_horizontal": true + }, + { + "x": 641, + "y": 178, + "length": 222, + "thickness": 4, + "is_horizontal": true + }, + { + "x": 570, + "y": 590, + "length": 336, + "thickness": 12, + "is_horizontal": true + }, + { + "x": 196, + "y": 565, + "length": 266, + "thickness": 8, + "is_horizontal": true + }, + { + "x": 961, + "y": 104, + "length": 124, + "thickness": 12, + "is_horizontal": false + }, + { + "x": 205, + "y": 674, + "length": 232, + "thickness": 5, + "is_horizontal": true + }, + { + "x": 65, + "y": 405, + "length": 340, + "thickness": 6, + "is_horizontal": true + }, + { + "x": 493, + "y": 107, + "length": 219, + "thickness": 4, + "is_horizontal": false + } + ] + }, + "param_hash": "f4800daa242401bd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/prompt.txt b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c75696cf4915ac1f2125c0d14c3e1a7234ca4a59 --- /dev/null +++ b/VBVR-Dataset/highlight_horizontal_lines_task/highlight_horizontal_lines_00000002/prompt.txt @@ -0,0 +1,3 @@ +The image contains several straight lines, including horizontal and vertical lines. +Circle every horizontal line. +Do not circle any vertical line. 
\ No newline at end of file diff --git a/VBVR-Dataset/homography_task/homography_00000000/final_frame.png b/VBVR-Dataset/homography_task/homography_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..05221b6881d53bd95ee67063f715ce5ac7cfac60 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000000/final_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a43ce1f6fa304c77c838c6cbc1a6ca69a0f52fbd46ad733759e8823fbc921282 +size 1053747 diff --git a/VBVR-Dataset/homography_task/homography_00000000/first_frame.png b/VBVR-Dataset/homography_task/homography_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bc797619286be59e2ba6386fdeaff53e76a61bce --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000000/first_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16313640e46647abdc3017a6a1344980ddb7bc728b92f7366e84047352107144 +size 1590647 diff --git a/VBVR-Dataset/homography_task/homography_00000000/ground_truth.mp4 b/VBVR-Dataset/homography_task/homography_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..efc3802e982b4124773b25079d2440c3efae40ac --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08aa97ab1dcfafa0c2d5c2a06383d05f55cba42f628383ce389bf31d1d78c95d +size 874685 diff --git a/VBVR-Dataset/homography_task/homography_00000000/metadata.json b/VBVR-Dataset/homography_task/homography_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9be89617489bd611ad6619f8cc4b96e9e7da3a93 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000000/metadata.json @@ -0,0 +1,240 @@ +{ + "task_id": "homography_00000000", + "generator": "homography", + "timestamp": "2026-02-17T08:08:05.820081", + "parameters": { + 
"task_type": "default", + "grid_rows": 8, + "grid_cols": 8, + "show_target_mesh": true, + "objects": { + "source_quad": { + "symbol": "source_quad", + "type": "quad", + "vertices": [ + { + "index": 0, + "position": [ + 102.400002, + 102.400002 + ] + }, + { + "index": 1, + "position": [ + 921.599976, + 102.400002 + ] + }, + { + "index": 2, + "position": [ + 921.599976, + 921.599976 + ] + }, + { + "index": 3, + "position": [ + 102.400002, + 921.599976 + ] + } + ] + }, + "target_quad": { + "symbol": "target_quad", + "type": "quad", + "color": [ + 214, + 69, + 88 + ], + "color_name": "red", + "vertices": [ + { + "index": 0, + "position": [ + 320.0, + 384.0 + ] + }, + { + "index": 1, + "position": [ + 800.0, + 416.0 + ] + }, + { + "index": 2, + "position": [ + 864.0, + 864.0 + ] + }, + { + "index": 3, + "position": [ + 256.0, + 896.0 + ] + } + ] + }, + "noise_points": [ + { + "symbol": "noise_point_0", + "index": 0, + "position": [ + 8, + 264 + ], + "radius": 2, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": "noise_point_1", + "index": 1, + "position": [ + 872, + 312 + ], + "radius": 2, + "color": [ + 80, + 180, + 255 + ] + }, + { + "symbol": "noise_point_2", + "index": 2, + "position": [ + 680, + 824 + ], + "radius": 5, + "color": [ + 80, + 180, + 255 + ] + }, + { + "symbol": "noise_point_3", + "index": 3, + "position": [ + 712, + 152 + ], + "radius": 3, + "color": [ + 230, + 180, + 90 + ] + }, + { + "symbol": "noise_point_4", + "index": 4, + "position": [ + 536, + 40 + ], + "radius": 3, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_5", + "index": 5, + "position": [ + 680, + 744 + ], + "radius": 5, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_6", + "index": 6, + "position": [ + 904, + 824 + ], + "radius": 5, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_7", + "index": 7, + "position": [ + 712, + 40 + ], + "radius": 2, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": 
"noise_point_8", + "index": 8, + "position": [ + 40, + 1000 + ], + "radius": 3, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_9", + "index": 9, + "position": [ + 952, + 696 + ], + "radius": 3, + "color": [ + 230, + 180, + 90 + ] + } + ], + "occlusions": [] + } + }, + "param_hash": "85ec5cb5d306c3b9", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/homography_task/homography_00000000/prompt.txt b/VBVR-Dataset/homography_task/homography_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ac5689fef8dbfded565afc25cb6297bbf7d32b56 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000000/prompt.txt @@ -0,0 +1 @@ +Transform the blue grid by aligning its four corners to the four corners of the red quadrilateral. Apply a perspective transformation so the grid matches the red outline. Keep all background elements, colored dots, and gray patches unchanged. Output the transformed grid. 
\ No newline at end of file diff --git a/VBVR-Dataset/homography_task/homography_00000001/final_frame.png b/VBVR-Dataset/homography_task/homography_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3af015190dff5c33d1d6c8a4007c1a6f81908f7c --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000001/final_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cd21b04d8cea10b888acc40cff6c17aace3d6bdc5f1ebc0af955a7731e8dc6 +size 1676914 diff --git a/VBVR-Dataset/homography_task/homography_00000001/first_frame.png b/VBVR-Dataset/homography_task/homography_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3aa1d883ea604caf8a09d7f33a500a2047fc21a6 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000001/first_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49e393c556dbe456045a4751991dee9758707c5e31e8c4062e49c90c149c343 +size 1595332 diff --git a/VBVR-Dataset/homography_task/homography_00000001/ground_truth.mp4 b/VBVR-Dataset/homography_task/homography_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3fb9025daf04c08d2dc546f97e8f8a8ebae46576 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3bbe68f45870e022b83fba08cd7d1e13ac7d443f68793a6a0b0a788ce3aee4a +size 1154607 diff --git a/VBVR-Dataset/homography_task/homography_00000001/metadata.json b/VBVR-Dataset/homography_task/homography_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f920a3e9b28f95354282c152d36d4695beb49bc8 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000001/metadata.json @@ -0,0 +1,282 @@ +{ + "task_id": "homography_00000001", + "generator": "homography", + "timestamp": "2026-02-17T08:08:07.019818", + "parameters": { + 
"task_type": "default", + "grid_rows": 8, + "grid_cols": 8, + "show_target_mesh": true, + "objects": { + "source_quad": { + "symbol": "source_quad", + "type": "quad", + "vertices": [ + { + "index": 0, + "position": [ + 102.400002, + 102.400002 + ] + }, + { + "index": 1, + "position": [ + 921.599976, + 102.400002 + ] + }, + { + "index": 2, + "position": [ + 921.599976, + 921.599976 + ] + }, + { + "index": 3, + "position": [ + 102.400002, + 921.599976 + ] + } + ] + }, + "target_quad": { + "symbol": "target_quad", + "type": "quad", + "color": [ + 214, + 69, + 88 + ], + "color_name": "red", + "vertices": [ + { + "index": 0, + "position": [ + 192.0, + 192.0 + ] + }, + { + "index": 1, + "position": [ + 608.0, + 224.0 + ] + }, + { + "index": 2, + "position": [ + 928.0, + 768.0 + ] + }, + { + "index": 3, + "position": [ + 192.0, + 800.0 + ] + } + ] + }, + "noise_points": [ + { + "symbol": "noise_point_0", + "index": 0, + "position": [ + 888, + 408 + ], + "radius": 2, + "color": [ + 230, + 180, + 90 + ] + }, + { + "symbol": "noise_point_1", + "index": 1, + "position": [ + 712, + 360 + ], + "radius": 3, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": "noise_point_2", + "index": 2, + "position": [ + 536, + 888 + ], + "radius": 2, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": "noise_point_3", + "index": 3, + "position": [ + 1000, + 1000 + ], + "radius": 2, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_4", + "index": 4, + "position": [ + 680, + 264 + ], + "radius": 5, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": "noise_point_5", + "index": 5, + "position": [ + 584, + 440 + ], + "radius": 2, + "color": [ + 230, + 180, + 90 + ] + }, + { + "symbol": "noise_point_6", + "index": 6, + "position": [ + 856, + 744 + ], + "radius": 4, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_7", + "index": 7, + "position": [ + 840, + 856 + ], + "radius": 4, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": 
"noise_point_8", + "index": 8, + "position": [ + 792, + 872 + ], + "radius": 4, + "color": [ + 230, + 180, + 90 + ] + }, + { + "symbol": "noise_point_9", + "index": 9, + "position": [ + 616, + 936 + ], + "radius": 4, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_10", + "index": 10, + "position": [ + 536, + 248 + ], + "radius": 4, + "color": [ + 230, + 180, + 90 + ] + }, + { + "symbol": "noise_point_11", + "index": 11, + "position": [ + 792, + 936 + ], + "radius": 5, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_12", + "index": 12, + "position": [ + 408, + 456 + ], + "radius": 2, + "color": [ + 230, + 180, + 90 + ] + } + ], + "occlusions": [] + } + }, + "param_hash": "b2307353334e9ea6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/homography_task/homography_00000001/prompt.txt b/VBVR-Dataset/homography_task/homography_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ac5689fef8dbfded565afc25cb6297bbf7d32b56 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000001/prompt.txt @@ -0,0 +1 @@ +Transform the blue grid by aligning its four corners to the four corners of the red quadrilateral. Apply a perspective transformation so the grid matches the red outline. Keep all background elements, colored dots, and gray patches unchanged. Output the transformed grid. 
\ No newline at end of file diff --git a/VBVR-Dataset/homography_task/homography_00000002/final_frame.png b/VBVR-Dataset/homography_task/homography_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8fec7e8e80f8933f8036ac34d5803d02076079f0 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000002/final_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df378dc894fdc4a644a33f32f7fd33092f810afe2225923244bb1e38a3825e5e +size 1663785 diff --git a/VBVR-Dataset/homography_task/homography_00000002/first_frame.png b/VBVR-Dataset/homography_task/homography_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a00a6fd710e5ad7f1a6e31922a4c97c86ae8cc6f --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000002/first_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707c3d4b3d06b07a6943c0d180e7cedb971738e0a806b48946ab1b333516d085 +size 1594905 diff --git a/VBVR-Dataset/homography_task/homography_00000002/ground_truth.mp4 b/VBVR-Dataset/homography_task/homography_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..98b8730470c26fe7e39f750a30162dd1bfbaa742 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd0254186459fdd47d900367b62cf0f27e67b3af5f726c478fe51ad3b37da45 +size 1096013 diff --git a/VBVR-Dataset/homography_task/homography_00000002/metadata.json b/VBVR-Dataset/homography_task/homography_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..505d0ac7342caa7f0e80786139d3f30ba863818d --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000002/metadata.json @@ -0,0 +1,198 @@ +{ + "task_id": "homography_00000002", + "generator": "homography", + "timestamp": "2026-02-17T08:08:08.206566", + "parameters": { + 
"task_type": "default", + "grid_rows": 8, + "grid_cols": 8, + "show_target_mesh": true, + "objects": { + "source_quad": { + "symbol": "source_quad", + "type": "quad", + "vertices": [ + { + "index": 0, + "position": [ + 102.400002, + 102.400002 + ] + }, + { + "index": 1, + "position": [ + 921.599976, + 102.400002 + ] + }, + { + "index": 2, + "position": [ + 921.599976, + 921.599976 + ] + }, + { + "index": 3, + "position": [ + 102.400002, + 921.599976 + ] + } + ] + }, + "target_quad": { + "symbol": "target_quad", + "type": "quad", + "color": [ + 214, + 69, + 88 + ], + "color_name": "red", + "vertices": [ + { + "index": 0, + "position": [ + 96.0, + 256.0 + ] + }, + { + "index": 1, + "position": [ + 576.0, + 288.0 + ] + }, + { + "index": 2, + "position": [ + 800.0, + 576.0 + ] + }, + { + "index": 3, + "position": [ + 96.0, + 576.0 + ] + } + ] + }, + "noise_points": [ + { + "symbol": "noise_point_0", + "index": 0, + "position": [ + 280, + 120 + ], + "radius": 5, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": "noise_point_1", + "index": 1, + "position": [ + 936, + 472 + ], + "radius": 5, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_2", + "index": 2, + "position": [ + 488, + 520 + ], + "radius": 4, + "color": [ + 255, + 92, + 92 + ] + }, + { + "symbol": "noise_point_3", + "index": 3, + "position": [ + 984, + 328 + ], + "radius": 3, + "color": [ + 230, + 180, + 90 + ] + }, + { + "symbol": "noise_point_4", + "index": 4, + "position": [ + 72, + 568 + ], + "radius": 2, + "color": [ + 80, + 200, + 120 + ] + }, + { + "symbol": "noise_point_5", + "index": 5, + "position": [ + 8, + 744 + ], + "radius": 2, + "color": [ + 80, + 180, + 255 + ] + }, + { + "symbol": "noise_point_6", + "index": 6, + "position": [ + 504, + 568 + ], + "radius": 3, + "color": [ + 80, + 200, + 120 + ] + } + ], + "occlusions": [] + } + }, + "param_hash": "6680633b714b598b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + 
"is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/homography_task/homography_00000002/prompt.txt b/VBVR-Dataset/homography_task/homography_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ac5689fef8dbfded565afc25cb6297bbf7d32b56 --- /dev/null +++ b/VBVR-Dataset/homography_task/homography_00000002/prompt.txt @@ -0,0 +1 @@ +Transform the blue grid by aligning its four corners to the four corners of the red quadrilateral. Apply a perspective transformation so the grid matches the red outline. Keep all background elements, colored dots, and gray patches unchanged. Output the transformed grid. \ No newline at end of file diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/final_frame.png b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..154b79ffa7efbb8e4cbf1cf6110b0b1d947f090f Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/final_frame.png differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/first_frame.png b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2e49970fde5da0507d7a074917af64e122e4da02 Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/first_frame.png differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/ground_truth.mp4 b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..8727637105e6b786dccd10c1c57f80274d65ed85 Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/metadata.json b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ed7c8b4ad08fbda740682e86fd3e77a43cdc2cad --- /dev/null +++ b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/metadata.json @@ -0,0 +1,67 @@ +{ + "task_id": "identify_figure_in_overlapping_area_00000000", + "generator": "identify_figure_in_overlapping_area", + "timestamp": "2026-02-17T06:51:21.529209", + "parameters": { + "shape_a": { + "type": "diamond", + "color": [ + 76, + 156, + 245 + ], + "vertices": [ + [ + 544.0, + 533.0 + ], + [ + 661.0, + 650.0 + ], + [ + 544.0, + 767.0 + ], + [ + 427.0, + 650.0 + ] + ], + "center": [ + 544.0, + 650.0 + ], + "size": [ + 234.0, + 234.0 + ] + }, + "shape_b": { + "type": "ellipse", + "color": [ + 161, + 157, + 64 + ], + "center": [ + 414.0, + 529.0 + ], + "size": [ + 189.0, + 110.0 + ] + } + }, + "param_hash": "4629d1e12eeb97c0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/prompt.txt b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..5138ebb33c0e536264bdb7c7da6921dafc9ce9cb --- /dev/null +++ 
b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows two translucent shapes that partially overlap: a diamond and a ellipse. First locate the region covered by both shapes (their intersection), then outline the exact boundary of that overlapping region with a red line. Show the complete outlining process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/final_frame.png b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..10b69bed3878f57aeb856147f39cdffb345399d4 Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/final_frame.png differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/first_frame.png b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ac6315407f0a48a12c48c44be2c887151a843aa8 Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/first_frame.png differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/ground_truth.mp4 b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d03a25d9a8f5c59b4baf1bcfa13d0ccc5cd933bd --- /dev/null +++ b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:98f3f6ba2bc946fba23edb1e7c5557dcc8eb9942d092c062041e18f47bb27256 +size 107430 diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/metadata.json b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..204de5f91a7b7cd6b1955cec226cfdf8469f14a7 --- /dev/null +++ b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/metadata.json @@ -0,0 +1,43 @@ +{ + "task_id": "identify_figure_in_overlapping_area_00000001", + "generator": "identify_figure_in_overlapping_area", + "timestamp": "2026-02-17T06:51:22.066772", + "parameters": { + "shape_a": { + "type": "circle", + "color": [ + 84, + 244, + 202 + ], + "center": [ + 720.0, + 577.0 + ], + "size": 190.0 + }, + "shape_b": { + "type": "circle", + "color": [ + 214, + 150, + 194 + ], + "center": [ + 521.0, + 691.0 + ], + "size": 180.0 + } + }, + "param_hash": "ab56aca5730a6efa", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/prompt.txt b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8b4c7ea44660537a340ffc0c8b72971179ebaa16 --- /dev/null +++ b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows two translucent shapes that partially overlap: a circle and a circle. First locate the region covered by both shapes (their intersection), then outline the exact boundary of that overlapping region with a red line. 
Show the complete outlining process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/final_frame.png b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..30d0fb4099fbabd7b3ed9bd8bb06013dbd2373e9 Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/final_frame.png differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/first_frame.png b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3e115d0b55bd6cd287eab9bd41eca48b58757d2e Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/first_frame.png differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/ground_truth.mp4 b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..18114e44acfb0ea087c72dc3b77f532435423f0a Binary files /dev/null and b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/metadata.json b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..817b51254622eea56b5037f017e0c1eeb34025f5 --- /dev/null +++ 
b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/metadata.json @@ -0,0 +1,46 @@ +{ + "task_id": "identify_figure_in_overlapping_area_00000002", + "generator": "identify_figure_in_overlapping_area", + "timestamp": "2026-02-17T06:51:22.614880", + "parameters": { + "shape_a": { + "type": "ellipse", + "color": [ + 220, + 155, + 58 + ], + "center": [ + 583.0, + 548.0 + ], + "size": [ + 194.0, + 110.0 + ] + }, + "shape_b": { + "type": "circle", + "color": [ + 205, + 142, + 61 + ], + "center": [ + 400.0, + 709.0 + ], + "size": 192.0 + } + }, + "param_hash": "8d7e5e2a47af04d0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/prompt.txt b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb58e6a5c92169b42d919bb8f0b0144a241f3e6d --- /dev/null +++ b/VBVR-Dataset/identify_figure_in_overlapping_area_task/identify_figure_in_overlapping_area_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows two translucent shapes that partially overlap: a ellipse and a circle. First locate the region covered by both shapes (their intersection), then outline the exact boundary of that overlapping region with a red line. Show the complete outlining process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/final_frame.png b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e0f7d6792b45d5d797c72cbe58bc4c67e92cfed1 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/final_frame.png differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/first_frame.png b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bf23b68ba61ad8d7a2f0ad9c3f7b949e2b335b23 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/first_frame.png differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/ground_truth.mp4 b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f4dbca5c6cb55f989f545180e8a8eede11e60f75 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/metadata.json b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6c75e4e1a19d4b4214edb90f7b651003d24f5776 --- /dev/null +++ b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/metadata.json @@ -0,0 +1,168 @@ +{ + "task_id": "identify_objects_in_region_00000000", + "generator": "identify_objects_in_region", + "timestamp": "2026-02-17T07:35:57.561810", + "parameters": { + 
"regions": [ + { + "id": 0, + "type": "rectangle", + "position": "left" + }, + { + "id": 1, + "type": "circle", + "position": "right" + } + ], + "shapes": [ + { + "type": "circle", + "color": [ + 30, + 142, + 153 + ], + "region_id": 0, + "position": [ + 265, + 511 + ], + "size": 70, + "is_target": true + }, + { + "type": "square", + "color": [ + 30, + 153, + 71 + ], + "region_id": 0, + "position": [ + 400, + 633 + ], + "size": 67, + "is_target": false + }, + { + "type": "square", + "color": [ + 215, + 229, + 114 + ], + "region_id": 0, + "position": [ + 130, + 511 + ], + "size": 71, + "is_target": false + }, + { + "type": "triangle", + "color": [ + 76, + 76, + 153 + ], + "region_id": 0, + "position": [ + 265, + 389 + ], + "size": 70, + "is_target": false + }, + { + "type": "triangle", + "color": [ + 153, + 30, + 81 + ], + "region_id": 1, + "position": [ + 704, + 350 + ], + "size": 58, + "is_target": false + }, + { + "type": "circle", + "color": [ + 132, + 30, + 153 + ], + "region_id": 1, + "position": [ + 812, + 458 + ], + "size": 58, + "is_target": false + }, + { + "type": "circle", + "color": [ + 153, + 53, + 111 + ], + "region_id": 1, + "position": [ + 704, + 458 + ], + "size": 61, + "is_target": false + }, + { + "type": "square", + "color": [ + 114, + 229, + 186 + ], + "region_id": 1, + "position": [ + 754, + 654 + ], + "size": 60, + "is_target": false + }, + { + "type": "triangle", + "color": [ + 30, + 112, + 153 + ], + "region_id": 1, + "position": [ + 920, + 458 + ], + "size": 60, + "is_target": false + } + ], + "target_region_id": 0, + "target_shape_type": "circle" + }, + "param_hash": "d41b37c57b49ca70", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/prompt.txt b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/prompt.txt new 
file mode 100644 index 0000000000000000000000000000000000000000..3f62fdc489b40dd07f0e95ffaf0c5be7885f9f9b --- /dev/null +++ b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000000/prompt.txt @@ -0,0 +1 @@ +Outline all circles in the square region with a green border. Only outline objects within that region. \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/final_frame.png b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..57eb0fc5180bffbfb789f66756a9f0fb407283e6 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/final_frame.png differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/first_frame.png b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fdfef8e724cb1bd64fe38f77406eabe23f08b69b Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/first_frame.png differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/ground_truth.mp4 b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d357c37a601faf788e47880b3b7dcd7ed9205769 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/metadata.json b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..420bfd6be6d2c7dcf071aa18bde80e46b75a2da0 --- /dev/null +++ b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/metadata.json @@ -0,0 +1,108 @@ +{ + "task_id": "identify_objects_in_region_00000001", + "generator": "identify_objects_in_region", + "timestamp": "2026-02-17T07:35:57.797804", + "parameters": { + "regions": [ + { + "id": 0, + "type": "circle", + "position": "left" + }, + { + "id": 1, + "type": "rectangle", + "position": "right" + } + ], + "shapes": [ + { + "type": "trapezoid", + "color": [ + 45, + 229, + 130 + ], + "region_id": 0, + "position": [ + 266, + 512 + ], + "size": 70, + "is_target": false + }, + { + "type": "triangle", + "color": [ + 45, + 229, + 130 + ], + "region_id": 0, + "position": [ + 374, + 404 + ], + "size": 70, + "is_target": false + }, + { + "type": "square", + "color": [ + 61, + 153, + 53 + ], + "region_id": 1, + "position": [ + 892, + 511 + ], + "size": 84, + "is_target": false + }, + { + "type": "triangle", + "color": [ + 114, + 157, + 229 + ], + "region_id": 1, + "position": [ + 622, + 389 + ], + "size": 85, + "is_target": true + }, + { + "type": "triangle", + "color": [ + 53, + 153, + 119 + ], + "region_id": 1, + "position": [ + 622, + 633 + ], + "size": 83, + "is_target": true + } + ], + "target_region_id": 1, + "target_shape_type": "triangle" + }, + "param_hash": "c226c2d2ac12213b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/prompt.txt b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2af6436dc56463d0813273312cfdb5b8c60c8e8b --- /dev/null +++ b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000001/prompt.txt @@ -0,0 
+1 @@ +Outline all triangles in the square region with a green border. Only outline objects within that region. \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/final_frame.png b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1ff1f3eaca0a8789d40dd21980630b4f036652b5 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/final_frame.png differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/first_frame.png b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3d133e96262dfd6d793d12da877432ef759e4339 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/first_frame.png differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/ground_truth.mp4 b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a8d6efacaed9bf69a9318f9b81579baf0f349c54 Binary files /dev/null and b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/metadata.json b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fc084bb5377e9392b4007b3067bc139561af2232 --- /dev/null +++ b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/metadata.json @@ -0,0 +1,153 @@ +{ + "task_id": 
"identify_objects_in_region_00000002", + "generator": "identify_objects_in_region", + "timestamp": "2026-02-17T07:35:58.034459", + "parameters": { + "regions": [ + { + "id": 0, + "type": "circle", + "position": "left" + }, + { + "id": 1, + "type": "rectangle", + "position": "right" + } + ], + "shapes": [ + { + "type": "triangle", + "color": [ + 80, + 229, + 123 + ], + "region_id": 0, + "position": [ + 122, + 512 + ], + "size": 82, + "is_target": false + }, + { + "type": "triangle", + "color": [ + 132, + 30, + 153 + ], + "region_id": 0, + "position": [ + 266, + 512 + ], + "size": 85, + "is_target": false + }, + { + "type": "square", + "color": [ + 153, + 119, + 53 + ], + "region_id": 0, + "position": [ + 266, + 656 + ], + "size": 87, + "is_target": true + }, + { + "type": "circle", + "color": [ + 30, + 142, + 153 + ], + "region_id": 1, + "position": [ + 605, + 466 + ], + "size": 60, + "is_target": false + }, + { + "type": "trapezoid", + "color": [ + 153, + 76, + 114 + ], + "region_id": 1, + "position": [ + 807, + 558 + ], + "size": 61, + "is_target": false + }, + { + "type": "square", + "color": [ + 215, + 229, + 114 + ], + "region_id": 1, + "position": [ + 908, + 466 + ], + "size": 58, + "is_target": false + }, + { + "type": "trapezoid", + "color": [ + 148, + 229, + 80 + ], + "region_id": 1, + "position": [ + 623, + 589 + ], + "size": 60, + "is_target": false + }, + { + "type": "circle", + "color": [ + 94, + 53, + 153 + ], + "region_id": 1, + "position": [ + 706, + 466 + ], + "size": 60, + "is_target": false + } + ], + "target_region_id": 0, + "target_shape_type": "square" + }, + "param_hash": "79dbd30cca6caac6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/prompt.txt b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/prompt.txt new 
file mode 100644 index 0000000000000000000000000000000000000000..8d8e3587a7feb1e02ede103510a08ee641c03d2d --- /dev/null +++ b/VBVR-Dataset/identify_objects_in_region_task/identify_objects_in_region_00000002/prompt.txt @@ -0,0 +1 @@ +Outline all squares in the circular region with a green border. Only outline objects within that region. \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000000/final_frame.png b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..937ee06545cd4f0a3257f6a7b0a944bf78f084e7 Binary files /dev/null and b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/final_frame.png differ diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000000/first_frame.png b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..86d20810c2670ca8a8681a3440a5fb49b3bdb8f7 Binary files /dev/null and b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/first_frame.png differ diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000000/ground_truth.mp4 b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b268ee3baf1174416afa9340ae158e96daca0815 --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b2e099abb71edc04165263eaa862b45eee19176d057e52d19765b9e73825d1 +size 117340 diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000000/metadata.json b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..68f0e469d3f890402ec392e12affd14e027683e0 --- /dev/null +++ 
b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/metadata.json @@ -0,0 +1,60 @@ +{ + "task_id": "identify_objects_00000000", + "generator": "identify_objects", + "timestamp": "2026-02-17T07:31:53.247392", + "parameters": { + "objects": [ + { + "shape": "triangle", + "color": "blue", + "size": 108, + "position": [ + 428, + 386 + ], + "is_target": false + }, + { + "shape": "rectangle", + "color": "red", + "size": 120, + "position": [ + 741, + 124 + ], + "is_target": false + }, + { + "shape": "hexagon", + "color": "orange", + "size": 84, + "position": [ + 217, + 109 + ], + "is_target": true + } + ], + "target_criteria": { + "shape": "hexagon", + "color": "orange", + "focus": "both" + }, + "type": "specific_combination", + "outline_color": [ + 0, + 0, + 255 + ] + }, + "param_hash": "15e990ae106b9e4d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000000/prompt.txt b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c713d858e88dd215b3492bb4bbbbe6cde4974700 --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000000/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple objects of different shapes and colors arranged randomly. Keep all objects unchanged in their shape, color, size, and position. Identify all orange hexagons and mark them by adding a thick blue outline around each one. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000001/final_frame.png b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dccd502e7f6d324f78bcf268d13ea6c2f1b2bc14 Binary files /dev/null and b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/final_frame.png differ diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000001/first_frame.png b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0c1e160137f5d64232761faf6bc9d878e02260f5 Binary files /dev/null and b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/first_frame.png differ diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000001/ground_truth.mp4 b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e568cbb41f4d1259b6d39435e60776c6d45e0e6f --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d88dcd41b827f483409542fe89db9c9d3cd48a09f62083490e71fa7dee10f28 +size 136686 diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000001/metadata.json b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..62ba151f87c7850f7d7bede548233212337f1ebb --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/metadata.json @@ -0,0 +1,70 @@ +{ + "task_id": "identify_objects_00000001", + "generator": "identify_objects", + "timestamp": "2026-02-17T07:31:54.201272", + "parameters": { + "objects": [ + { + "shape": "square", + "color": "red", + "size": 114, + "position": [ + 544, + 849 + ], + "is_target": true + 
}, + { + "shape": "hexagon", + "color": "red", + "size": 90, + "position": [ + 816, + 470 + ], + "is_target": false + }, + { + "shape": "pentagon", + "color": "yellow", + "size": 93, + "position": [ + 686, + 723 + ], + "is_target": false + }, + { + "shape": "circle", + "color": "green", + "size": 110, + "position": [ + 619, + 464 + ], + "is_target": false + } + ], + "target_criteria": { + "shape": "square", + "color": "red", + "focus": "color" + }, + "type": "color_focus", + "outline_color": [ + 0, + 0, + 255 + ] + }, + "param_hash": "20c94d0e31f9b455", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000001/prompt.txt b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..980b398ddfbb1792d7d763bfd27355cac106e15e --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000001/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple objects of different shapes and colors arranged randomly. Keep all objects unchanged in their shape, color, size, and position. Identify all red objects and mark them by adding a thick blue outline around each one. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000002/final_frame.png b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ff32e95b30a7e4a70416c100f6f97dd2bac1496e Binary files /dev/null and b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/final_frame.png differ diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000002/first_frame.png b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..54b714780d9a4695325a11f1e5b1308d09b49257 Binary files /dev/null and b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/first_frame.png differ diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000002/ground_truth.mp4 b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3068620d68c4d357168836c388b47bb4b1b0b75a --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee03f29298d15b412fcd03e107e24c57db49fda56569244838bee83afb4c5926 +size 157481 diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000002/metadata.json b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7ee6534ddedd30224f8746ed43d1e67d7436617c --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/metadata.json @@ -0,0 +1,60 @@ +{ + "task_id": "identify_objects_00000002", + "generator": "identify_objects", + "timestamp": "2026-02-17T07:31:55.110061", + "parameters": { + "objects": [ + { + "shape": "circle", + "color": "orange", + "size": 87, + "position": [ + 436, + 309 + ], + "is_target": true 
+ }, + { + "shape": "circle", + "color": "orange", + "size": 93, + "position": [ + 487, + 885 + ], + "is_target": true + }, + { + "shape": "circle", + "color": "orange", + "size": 99, + "position": [ + 599, + 103 + ], + "is_target": true + } + ], + "target_criteria": { + "shape": "circle", + "color": "orange", + "focus": "both" + }, + "type": "specific_combination", + "outline_color": [ + 0, + 0, + 255 + ] + }, + "param_hash": "bfebd3500ce35e41", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_objects_task/identify_objects_00000002/prompt.txt b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ad5f6cc39f6c94aeab15f183f0e214a5f62d7f67 --- /dev/null +++ b/VBVR-Dataset/identify_objects_task/identify_objects_00000002/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple objects of different shapes and colors arranged randomly. Keep all objects unchanged in their shape, color, size, and position. Identify all orange circles and mark them by adding a thick blue outline around each one. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/final_frame.png b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4b638971224d3e10f50b4ecd0fde65d069c966ed Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/final_frame.png differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/first_frame.png b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2c9f2b6f67654515e3b13d882d2095bf0e1d3e57 Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/first_frame.png differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/ground_truth.mp4 b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..8f5884dedd496596d7119ce82e74cb92fbd8279a Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/metadata.json b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dc70a30287c4898ece4e43a3d71344f67725b8c1 --- /dev/null +++ b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "identify_one_and_nine_00000000", + "generator": "identify_one_and_nine", + "timestamp": "2026-02-17T06:58:55.165118", + "parameters": { + "numbers": [ + { + "value": 2, + "position": [ + 915.0, + 864.0 + ] + }, + { + "value": 7, + "position": [ + 175.0, + 507.0 + ] + 
}, + { + "value": 9, + "position": [ + 438.0, + 471.0 + ] + }, + { + "value": 8, + "position": [ + 138.0, + 196.0 + ] + }, + { + "value": 6, + "position": [ + 906.0, + 131.0 + ] + }, + { + "value": 1, + "position": [ + 784.0, + 464.0 + ] + } + ], + "target_numbers": [ + 1, + 9 + ] + }, + "param_hash": "9bec07c3b4104946", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/prompt.txt b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4403c6b01dec55bb91e0f30f729fb03d4dae7ad0 --- /dev/null +++ b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000000/prompt.txt @@ -0,0 +1,4 @@ +The image shows a subset of digits chosen from 1 to 9 placed in different positions. +Find digit 1 and digit 9. +Only circle digits '1' and '9'. Do not circle other digits. +Draw a red circle around each target digit. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/final_frame.png b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..61d4d865c37951097682f50f188fe29214496c52 Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/final_frame.png differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/first_frame.png b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..55e0d2d7d97c8db5af11e0ca19c3f5f2a33f14dc Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/first_frame.png differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/ground_truth.mp4 b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..21c87a15e51b337c0863654f3ffce40e7b16bc20 Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/metadata.json b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..61c3eb323e7324d8869624f60ec221d45ef40cd8 --- /dev/null +++ b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "identify_one_and_nine_00000001", + "generator": "identify_one_and_nine", + "timestamp": "2026-02-17T06:58:56.298497", + "parameters": { + "numbers": [ + { + "value": 1, + "position": [ + 535.0, + 907.0 + ] + }, + { + "value": 9, + "position": [ + 183.0, + 237.0 + ] + 
}, + { + "value": 2, + "position": [ + 526.0, + 104.0 + ] + }, + { + "value": 5, + "position": [ + 779.0, + 793.0 + ] + }, + { + "value": 6, + "position": [ + 125.0, + 446.0 + ] + }, + { + "value": 7, + "position": [ + 182.0, + 837.0 + ] + }, + { + "value": 4, + "position": [ + 919.0, + 130.0 + ] + }, + { + "value": 3, + "position": [ + 561.0, + 496.0 + ] + } + ], + "target_numbers": [ + 1, + 9 + ] + }, + "param_hash": "358e0f40ba107443", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/prompt.txt b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4403c6b01dec55bb91e0f30f729fb03d4dae7ad0 --- /dev/null +++ b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000001/prompt.txt @@ -0,0 +1,4 @@ +The image shows a subset of digits chosen from 1 to 9 placed in different positions. +Find digit 1 and digit 9. +Only circle digits '1' and '9'. Do not circle other digits. +Draw a red circle around each target digit. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/final_frame.png b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c941dd4f5ef770e7375cfcf1578227b3eb3ac0f2 Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/final_frame.png differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/first_frame.png b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..395ae0eab5e747ddf716589da5c06cc7cbe2faab Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/first_frame.png differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/ground_truth.mp4 b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6e7206b929d763af438c5b62f5978c71f3b4d58b Binary files /dev/null and b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/metadata.json b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9883acf016aa7c97e7837ae9b0112675857bc3b1 --- /dev/null +++ b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "identify_one_and_nine_00000002", + "generator": "identify_one_and_nine", + "timestamp": "2026-02-17T06:58:57.460934", + "parameters": { + "numbers": [ + { + "value": 3, + "position": [ + 161.0, + 894.0 + ] + }, + { + "value": 1, + "position": [ + 460.0, + 789.0 + ] + 
}, + { + "value": 6, + "position": [ + 784.0, + 580.0 + ] + }, + { + "value": 2, + "position": [ + 902.0, + 909.0 + ] + }, + { + "value": 8, + "position": [ + 183.0, + 573.0 + ] + }, + { + "value": 5, + "position": [ + 548.0, + 152.0 + ] + }, + { + "value": 9, + "position": [ + 792.0, + 211.0 + ] + }, + { + "value": 7, + "position": [ + 481.0, + 486.0 + ] + } + ], + "target_numbers": [ + 1, + 9 + ] + }, + "param_hash": "473c358873f2392e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/prompt.txt b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4403c6b01dec55bb91e0f30f729fb03d4dae7ad0 --- /dev/null +++ b/VBVR-Dataset/identify_one_and_nine_task/identify_one_and_nine_00000002/prompt.txt @@ -0,0 +1,4 @@ +The image shows a subset of digits chosen from 1 to 9 placed in different positions. +Find digit 1 and digit 9. +Only circle digits '1' and '9'. Do not circle other digits. +Draw a red circle around each target digit. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/final_frame.png b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bc4a7b2da97d317707d26c3f0eee437dd29d18b4 Binary files /dev/null and b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/final_frame.png differ diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/first_frame.png b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b3dc0a6df3475a1660b4f21c34ad24d97941c5a6 Binary files /dev/null and b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/first_frame.png differ diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/ground_truth.mp4 b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6bd87c9e2aa4cb7ddf8d1ea98ca6e59d1a4f452f --- /dev/null +++ b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98837b0ba12d5c98b7bfcad30f1b6f82e060e4651a9ea77cf0cb9eaa90e2b88 +size 131435 diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/metadata.json b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7767ecb58301f891ed2d5b9d6cba461859dee733 --- /dev/null +++ 
b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/metadata.json @@ -0,0 +1,76 @@ +{ + "task_id": "identify_polygon_with_most_sides_00000000", + "generator": "identify_polygon_with_most_sides", + "timestamp": "2026-02-17T06:53:37.371260", + "parameters": { + "shapes": [ + { + "type": "polygon", + "color": [ + 221, + 192, + 188 + ], + "center": [ + 204.8, + 512.0 + ], + "num_edges": 7, + "size": 44.904763 + }, + { + "type": "polygon", + "color": [ + 171, + 200, + 164 + ], + "center": [ + 409.6, + 512.0 + ], + "num_edges": 9, + "size": 59.180614 + }, + { + "type": "polygon", + "color": [ + 229, + 230, + 214 + ], + "center": [ + 614.4, + 512.0 + ], + "num_edges": 8, + "size": 81.067192 + }, + { + "type": "polygon", + "color": [ + 184, + 227, + 150 + ], + "center": [ + 819.2, + 512.0 + ], + "num_edges": 7, + "size": 46.657695 + } + ], + "target_index": 1 + }, + "param_hash": "9b2b6872eee63501", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/prompt.txt b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..90534aa4ba4ffc72a0fa30d95175e087c311c3e8 --- /dev/null +++ b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000000/prompt.txt @@ -0,0 +1 @@ +Circle the shape with the most sides among several shapes placed side by side. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/final_frame.png b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b92cb04ff7a52fdc98ea996f3408c106de67eccd Binary files /dev/null and b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/final_frame.png differ diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/first_frame.png b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b0b631513154954961f0b687995ef6a14d31bcd1 Binary files /dev/null and b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/first_frame.png differ diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/ground_truth.mp4 b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..9b2a8a5424b043a867cf75f5e164598b8d18ae7e --- /dev/null +++ b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7dbe7c5c92bb0a03399949dc3a8e7efa70d9e4c08c391ce0a43828757cf386 +size 120188 diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/metadata.json b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..80e70189aedff29412a2eda99773405a1b763c14 --- /dev/null +++ 
b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/metadata.json @@ -0,0 +1,76 @@ +{ + "task_id": "identify_polygon_with_most_sides_00000001", + "generator": "identify_polygon_with_most_sides", + "timestamp": "2026-02-17T06:53:37.769330", + "parameters": { + "shapes": [ + { + "type": "polygon", + "color": [ + 169, + 156, + 181 + ], + "center": [ + 204.8, + 512.0 + ], + "num_edges": 4, + "size": 58.473166 + }, + { + "type": "polygon", + "color": [ + 209, + 176, + 194 + ], + "center": [ + 409.6, + 512.0 + ], + "num_edges": 3, + "size": 57.46592 + }, + { + "type": "polygon", + "color": [ + 210, + 229, + 183 + ], + "center": [ + 614.4, + 512.0 + ], + "num_edges": 3, + "size": 66.699112 + }, + { + "type": "polygon", + "color": [ + 192, + 217, + 196 + ], + "center": [ + 819.2, + 512.0 + ], + "num_edges": 3, + "size": 47.960226 + } + ], + "target_index": 0 + }, + "param_hash": "d0d205a92418ed0f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/prompt.txt b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..90534aa4ba4ffc72a0fa30d95175e087c311c3e8 --- /dev/null +++ b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000001/prompt.txt @@ -0,0 +1 @@ +Circle the shape with the most sides among several shapes placed side by side. 
\ No newline at end of file diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/final_frame.png b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2c83681cee09bec9ac49821aea9033f972b38251 Binary files /dev/null and b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/final_frame.png differ diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/first_frame.png b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..24cfe906080e5b85901b6e24fd5ae0672c6e03c3 Binary files /dev/null and b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/first_frame.png differ diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/ground_truth.mp4 b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a7ddb5469002f627c0f0697e03176a37422296e7 --- /dev/null +++ b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2445aa88629d2f9732fac1740675b610622b47dd6a6242293bbd39ab230a009c +size 150002 diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/metadata.json b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..2c70d630f3bcb647106e94cad842af5341766c9d --- /dev/null +++ 
b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/metadata.json @@ -0,0 +1,76 @@ +{ + "task_id": "identify_polygon_with_most_sides_00000002", + "generator": "identify_polygon_with_most_sides", + "timestamp": "2026-02-17T06:53:38.164904", + "parameters": { + "shapes": [ + { + "type": "polygon", + "color": [ + 228, + 201, + 213 + ], + "center": [ + 204.8, + 512.0 + ], + "num_edges": 6, + "size": 64.703573 + }, + { + "type": "polygon", + "color": [ + 152, + 220, + 165 + ], + "center": [ + 409.6, + 512.0 + ], + "num_edges": 5, + "size": 63.154265 + }, + { + "type": "polygon", + "color": [ + 152, + 212, + 177 + ], + "center": [ + 614.4, + 512.0 + ], + "num_edges": 9, + "size": 79.490847 + }, + { + "type": "polygon", + "color": [ + 193, + 177, + 199 + ], + "center": [ + 819.2, + 512.0 + ], + "num_edges": 5, + "size": 69.865276 + } + ], + "target_index": 2 + }, + "param_hash": "c4c759dffd382263", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/prompt.txt b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..90534aa4ba4ffc72a0fa30d95175e087c311c3e8 --- /dev/null +++ b/VBVR-Dataset/identify_polygon_with_most_sides_task/identify_polygon_with_most_sides_00000002/prompt.txt @@ -0,0 +1 @@ +Circle the shape with the most sides among several shapes placed side by side. 
\ No newline at end of file diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/final_frame.png b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..733be866d7c10c1391e993473efc6972692759e1 --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/final_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597f437ca7b53209fc7e91ee8d733c1837b0d2589710d393a3d64265bc19304c +size 104729 diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/first_frame.png b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..781e29244df5b4d07633446ba1c266fc3e31a28f Binary files /dev/null and b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/first_frame.png differ diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/ground_truth.mp4 b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..62784bad31c80f78e1a33f4cc3990236266f3bb3 --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ba187bfcfa0d24f41112d73a6a195b642a3587efc2c76d2c92d3011c5baf6e3 +size 296189 diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/metadata.json b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6509ff8c4df7a102bd92b02fd1d9e2eb8148826a --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "ink_diffusion_00000000", + "generator": "ink_diffusion", + "timestamp": "2026-02-17T08:09:41.168223", + "parameters": { + "ink_color_rgb": [ + 255, + 218, + 185 + ], + "ink_color_name": 
"colored", + "ink_to_water_ratio": 0.003049, + "final_concentration": 0.8, + "diffusion_coefficient": 1.925867, + "temperature_factor": 1.06708, + "video_duration_seconds": 8.0, + "total_frames": 128, + "fps": 16, + "objects": { + "beaker": { + "symbol": "beaker", + "type": "container", + "shape": "cone_up", + "shape_name": "flask-shaped", + "bounds": { + "left": 317, + "right": 706, + "top": 256, + "bottom": 911 + }, + "width": 389, + "height": 655, + "water_surface_y": 406, + "water_fill_ratio": 0.82, + "water_volume_ml": 164.0 + }, + "droplet": { + "symbol": "droplet", + "type": "ink_droplet", + "color": [ + 255, + 218, + 185 + ], + "color_name": "colored", + "initial_position": [ + 518.3075, + 176.0 + ], + "position_ratio": 0.05, + "volume_ml": 0.5 + } + } + }, + "param_hash": "8e254b1e2c5f0013", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/prompt.txt b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cda20f3f49976ec7ba3cc2977dec8a96e23f1bcf --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000000/prompt.txt @@ -0,0 +1 @@ +An ink droplet falls from above the center of a glass beaker filled with water. Upon entering the water, the ink forms irregular downward-extending tendrils due to gravity and initial impact. The ink then diffuses through the water, creating swirling patterns and eddies, until it reaches a stable state of uniform color distribution throughout the entire volume of water. 
\ No newline at end of file diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/final_frame.png b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..73c0906d624aaa98a0c9a4a1a5dacaa73acd4acd --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/final_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d959866801f77bf426becb702d66a68df85eea5e0b09ed3ee43e416b62adf45b +size 124481 diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/first_frame.png b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1bde28924db0bf2a6c298f0112df6e598960b0c0 Binary files /dev/null and b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/first_frame.png differ diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/ground_truth.mp4 b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..868d55a72c735eca4f0828fa0544caac9398b2c7 --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a5be6d1b1c8a45724559d73bdcae76ae7453a85a0df6c186f4a3c96c496b70 +size 669669 diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/metadata.json b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..191c28c70b8abfadfb673537749c753cae17dd98 --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "ink_diffusion_00000001", + "generator": "ink_diffusion", + "timestamp": "2026-02-17T08:09:52.506854", + "parameters": { + "ink_color_rgb": [ + 123, + 104, + 238 + ], + "ink_color_name": 
"slate-blue", + "ink_to_water_ratio": 0.003049, + "final_concentration": 0.8, + "diffusion_coefficient": 1.925867, + "temperature_factor": 1.06708, + "video_duration_seconds": 8.0, + "total_frames": 128, + "fps": 16, + "objects": { + "beaker": { + "symbol": "beaker", + "type": "container", + "shape": "cone_up", + "shape_name": "flask-shaped", + "bounds": { + "left": 317, + "right": 706, + "top": 256, + "bottom": 911 + }, + "width": 389, + "height": 655, + "water_surface_y": 406, + "water_fill_ratio": 0.82, + "water_volume_ml": 164.0 + }, + "droplet": { + "symbol": "droplet", + "type": "ink_droplet", + "color": [ + 123, + 104, + 238 + ], + "color_name": "slate-blue", + "initial_position": [ + 520.009375, + 176.0 + ], + "position_ratio": 0.0625, + "volume_ml": 0.5 + } + } + }, + "param_hash": "9aea00e0b035ab45", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/prompt.txt b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cda20f3f49976ec7ba3cc2977dec8a96e23f1bcf --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000001/prompt.txt @@ -0,0 +1 @@ +An ink droplet falls from above the center of a glass beaker filled with water. Upon entering the water, the ink forms irregular downward-extending tendrils due to gravity and initial impact. The ink then diffuses through the water, creating swirling patterns and eddies, until it reaches a stable state of uniform color distribution throughout the entire volume of water. 
\ No newline at end of file diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/final_frame.png b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d6e41d87a8f6def0aa6a72d865f67927b067a289 --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/final_frame.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50196e799d039fdabfbf02815226d5d2e76d9be8bc481ab8d04a42fadc6e2539 +size 111287 diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/first_frame.png b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a2de1055fbbcaedf59b9f813b309a8b15ee5d525 Binary files /dev/null and b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/first_frame.png differ diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/ground_truth.mp4 b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..246265efc9ce60fa248c9c5cb64fac154f9a5e5a --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2dc2236411e43dbfd3dd9a1566abb1dcdb4e9668dad42977f551638e442263 +size 381903 diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/metadata.json b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1e93503265c8034a847068f367b18c035dba31dd --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "ink_diffusion_00000002", + "generator": "ink_diffusion", + "timestamp": "2026-02-17T08:10:03.239042", + "parameters": { + "ink_color_rgb": [ + 144, + 238, + 144 + ], + "ink_color_name": 
"colored", + "ink_to_water_ratio": 0.003049, + "final_concentration": 0.8, + "diffusion_coefficient": 1.925867, + "temperature_factor": 1.06708, + "video_duration_seconds": 8.0, + "total_frames": 128, + "fps": 16, + "objects": { + "beaker": { + "symbol": "beaker", + "type": "container", + "shape": "cone_up", + "shape_name": "flask-shaped", + "bounds": { + "left": 317, + "right": 706, + "top": 256, + "bottom": 911 + }, + "width": 389, + "height": 655, + "water_surface_y": 406, + "water_fill_ratio": 0.82, + "water_volume_ml": 164.0 + }, + "droplet": { + "symbol": "droplet", + "type": "ink_droplet", + "color": [ + 144, + 238, + 144 + ], + "color_name": "colored", + "initial_position": [ + 521.71125, + 176.0 + ], + "position_ratio": 0.075, + "volume_ml": 0.5 + } + } + }, + "param_hash": "da1acdf848cc0894", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/prompt.txt b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cda20f3f49976ec7ba3cc2977dec8a96e23f1bcf --- /dev/null +++ b/VBVR-Dataset/ink_diffusion_task/ink_diffusion_00000002/prompt.txt @@ -0,0 +1 @@ +An ink droplet falls from above the center of a glass beaker filled with water. Upon entering the water, the ink forms irregular downward-extending tendrils due to gravity and initial impact. The ink then diffuses through the water, creating swirling patterns and eddies, until it reaches a stable state of uniform color distribution throughout the entire volume of water. 
\ No newline at end of file diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/final_frame.png b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3cbf957449b5b03beda33c0c0cd9abbd73fa6929 Binary files /dev/null and b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/final_frame.png differ diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/first_frame.png b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d7217441e9648de93de93c08e26865bc333b7b6a Binary files /dev/null and b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/first_frame.png differ diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/ground_truth.mp4 b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3f0687f05ba75c4e09caf1f6b181f31a3890f74f --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1573ea92e96fa3a5ad3f519b0b24ba14e565f9a2322564d57d9cac59972e6833 +size 410977 diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/metadata.json b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..c6a0246d5996dcc4df7911a343bbd29ae230df73 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/metadata.json @@ -0,0 +1,114 @@ +{ + "task_id": "key_door_matching_00000000", + "generator": "key_door_matching", + "timestamp": "2026-02-17T07:29:12.792362", + "parameters": { + "style": "grid", + "agent_start_position": [ + 1, + 1 + ], + "keys": [ + { + "pos": [ + 3, + 11 + 
], + "color": [ + 255, + 0, + 0 + ] + }, + { + "pos": [ + 5, + 9 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "pos": [ + 11, + 3 + ], + "color": [ + 255, + 255, + 0 + ] + } + ], + "doors": [ + { + "pos": [ + 7, + 5 + ], + "color": [ + 255, + 0, + 0 + ] + }, + { + "pos": [ + 9, + 3 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "pos": [ + 8, + 9 + ], + "color": [ + 255, + 255, + 0 + ] + } + ], + "target_color": [ + 0, + 0, + 255 + ], + "grid": [ + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1], + [1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1] + ], + "width": 13, + "height": 13 + }, + "param_hash": "37062bbeac5d3545", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/prompt.txt b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9c197062fb132aee6b07186c12cfd1ba009d0c36 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a maze with a green circular agent, colored diamond-shaped keys, and colored hollow rectangular doors. Find the Blue key and then navigate to the matching Blue door, showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/final_frame.png b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e1a47f0b803db17a260a958b7f535c8333955545 Binary files /dev/null and b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/final_frame.png differ diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/first_frame.png b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4f026bded88cde00da1d9013fa68d10201c8cbe5 Binary files /dev/null and b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/first_frame.png differ diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/ground_truth.mp4 b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c361c6d27f39046863b6334b0393cf479d644ece --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a90a1907e45e336a8bb8e3bf704536a49d22113336f4bd5543d5fa6d8f008d5 +size 328955 diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/metadata.json b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3fa2cb81dce0ffce088f97db55fc673e3a93f2f2 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/metadata.json @@ -0,0 +1,114 @@ +{ + "task_id": "key_door_matching_00000001", + "generator": "key_door_matching", + "timestamp": "2026-02-17T07:29:13.415263", + "parameters": { + "style": "grid", + "agent_start_position": [ + 1, + 1 + ], + "keys": [ + { + "pos": [ + 7, + 1 + ], 
+ "color": [ + 255, + 0, + 0 + ] + }, + { + "pos": [ + 9, + 1 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "pos": [ + 11, + 5 + ], + "color": [ + 255, + 255, + 0 + ] + } + ], + "doors": [ + { + "pos": [ + 5, + 9 + ], + "color": [ + 255, + 0, + 0 + ] + }, + { + "pos": [ + 11, + 11 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "pos": [ + 1, + 11 + ], + "color": [ + 255, + 255, + 0 + ] + } + ], + "target_color": [ + 255, + 255, + 0 + ], + "grid": [ + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], + [1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1], + [1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1], + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1] + ], + "width": 13, + "height": 13 + }, + "param_hash": "dc6d742dba348d33", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/prompt.txt b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..37d06c5044c2dadcd6ac9f93a5711ec7d0df51d7 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a maze with a green circular agent, colored diamond-shaped keys, and colored hollow rectangular doors. Find the Yellow key and then navigate to the matching Yellow door, showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/final_frame.png b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bd1a025b1ed3c6704c86a7a2e6411e2cd126f58a Binary files /dev/null and b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/final_frame.png differ diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/first_frame.png b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4acbb2b8d75c20fb844aef32e7b186b43ef9fe5e Binary files /dev/null and b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/first_frame.png differ diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/ground_truth.mp4 b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..68485f50f1d4cd75ebb5655c1733a5efb1d8bd79 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faee48138ebc51127014496b8397f334330d6de30906475c78beaee4a509fdb7 +size 412533 diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/metadata.json b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ae039589ffc1ed12749bc1ff4a795a8b4d8c8f83 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/metadata.json @@ -0,0 +1,114 @@ +{ + "task_id": "key_door_matching_00000002", + "generator": "key_door_matching", + "timestamp": "2026-02-17T07:29:14.241006", + "parameters": { + "style": "grid", + "agent_start_position": [ + 1, + 1 + ], + "keys": [ + { + "pos": [ + 1, + 9 + ], 
+ "color": [ + 255, + 0, + 0 + ] + }, + { + "pos": [ + 11, + 7 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "pos": [ + 9, + 2 + ], + "color": [ + 255, + 255, + 0 + ] + } + ], + "doors": [ + { + "pos": [ + 3, + 5 + ], + "color": [ + 255, + 0, + 0 + ] + }, + { + "pos": [ + 9, + 5 + ], + "color": [ + 0, + 0, + 255 + ] + }, + { + "pos": [ + 3, + 9 + ], + "color": [ + 255, + 255, + 0 + ] + } + ], + "target_color": [ + 255, + 0, + 0 + ], + "grid": [ + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], + [1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 0, 1], + [1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 0, 1, 0, 1, 1, 1], + [1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1], + [1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1], + [1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1], + [1, 0, 1, 1, 1, 0, 1, 1, 1, 0, 1, 0, 1], + [1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1], + [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1] + ], + "width": 13, + "height": 13 + }, + "param_hash": "be8cd28440c5b039", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/prompt.txt b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ecbd8715992ba32a617ac40c3a7482504d950d81 --- /dev/null +++ b/VBVR-Dataset/key_door_matching_task/key_door_matching_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a maze with a green circular agent, colored diamond-shaped keys, and colored hollow rectangular doors. Find the Red key and then navigate to the matching Red door, showing the complete movement process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/final_frame.png b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4323a71516084c913ca269a6ea634e1d0e8f9a46 Binary files /dev/null and b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/final_frame.png differ diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/first_frame.png b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3f805a989157175975df302e4be58cae1acb718b Binary files /dev/null and b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/first_frame.png differ diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/ground_truth.mp4 b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..72a4691f355f684c0b65285c5e349cd44eb8fac7 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5990fca69912199878f424fd6a2db7b03c2e7d04a37f79b465669fae012c78 +size 315269 diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/metadata.json b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4df37cff325cb082df1def260e10fa170983c864 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/metadata.json @@ -0,0 +1,131 @@ +{ + "task_id": 
"lego_construction_assembly_00000000", + "generator": "lego_construction_assembly", + "timestamp": "2026-02-17T07:45:06.910079", + "parameters": { + "step": 3, + "model_type": "base_add", + "model_name": "Base3_Add2_6132", + "new_brick_index": 3, + "objects": [ + { + "symbol": "brick", + "brick_type": "1x2", + "color": "white", + "position": [ + 1, + 0, + 0 + ], + "center_3d": [ + 1.5, + 1.0, + 1.5 + ], + "center_2d": [ + 703, + 714 + ], + "rotation": 0, + "size": [ + 1, + 2, + 3 + ], + "is_new": false, + "step_index": 0 + }, + { + "symbol": "brick", + "brick_type": "1x2", + "color": "white", + "position": [ + 2, + 0, + 0 + ], + "center_3d": [ + 2.5, + 1.0, + 1.5 + ], + "center_2d": [ + 746, + 739 + ], + "rotation": 0, + "size": [ + 1, + 2, + 3 + ], + "is_new": false, + "step_index": 1 + }, + { + "symbol": "brick", + "brick_type": "1x2", + "color": "white", + "position": [ + 1, + 2, + 0 + ], + "center_3d": [ + 1.5, + 3.0, + 1.5 + ], + "center_2d": [ + 617, + 764 + ], + "rotation": 0, + "size": [ + 1, + 2, + 3 + ], + "is_new": false, + "step_index": 2 + }, + { + "symbol": "brick", + "brick_type": "2x2", + "color": "blue", + "position": [ + 1, + 4, + 0 + ], + "center_3d": [ + 2.0, + 5.0, + 1.5 + ], + "center_2d": [ + 552, + 827 + ], + "rotation": 90, + "size": [ + 2, + 2, + 3 + ], + "is_new": true, + "step_index": 3 + } + ] + }, + "param_hash": "c6325613ad6fd900", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/prompt.txt b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..73fc0ce4be4b830ad7b7a93d902bc8a4ada5a928 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000000/prompt.txt @@ -0,0 +1 @@ +This is LEGO assembly 
step 4. The scene shows a partial model on the right and a 2x2 blue brick on the left in a callout box. Take the blue brick and attach it to the model at the position indicated by the red arrow. Move the brick smoothly from the callout to its destination, align it correctly, and snap it into place. \ No newline at end of file diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/final_frame.png b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..adf6d48b5fcdb65736136b35ce3b381c4f300e72 Binary files /dev/null and b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/final_frame.png differ diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/first_frame.png b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..55e3b559e88c151d0c100ea8ebf22066764af0f3 Binary files /dev/null and b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/first_frame.png differ diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/ground_truth.mp4 b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..555080d9be2b1fb23adad63bfafb8e8106873878 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f32e379c2c3baba02471cdeacfabeacd688757cbe775669cccb10318435a474 +size 326834 diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/metadata.json 
b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f96fcfe2f2e639cb23184327e2fdb38def5b8466 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/metadata.json @@ -0,0 +1,77 @@ +{ + "task_id": "lego_construction_assembly_00000001", + "generator": "lego_construction_assembly", + "timestamp": "2026-02-17T07:45:07.570989", + "parameters": { + "step": 1, + "model_type": "base_add", + "model_name": "Base1_Add1_4375", + "new_brick_index": 1, + "objects": [ + { + "symbol": "brick", + "brick_type": "2x4", + "color": "white", + "position": [ + 3, + 0, + 0 + ], + "center_3d": [ + 4.0, + 2.0, + 1.5 + ], + "center_2d": [ + 768, + 802 + ], + "rotation": 0, + "size": [ + 2, + 4, + 3 + ], + "is_new": false, + "step_index": 0 + }, + { + "symbol": "brick", + "brick_type": "2x2", + "color": "green", + "position": [ + 5, + 0, + 0 + ], + "center_3d": [ + 6.0, + 1.0, + 1.5 + ], + "center_2d": [ + 898, + 827 + ], + "rotation": 90, + "size": [ + 2, + 2, + 3 + ], + "is_new": true, + "step_index": 1 + } + ] + }, + "param_hash": "1a25f03d5163e484", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/prompt.txt b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4b6068f59822465337cf2a7efd70870ab70d5344 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000001/prompt.txt @@ -0,0 +1 @@ +This is LEGO assembly step 2. The scene shows a partial model on the right and a 2x2 green brick on the left in a callout box. 
Take the green brick and attach it to the model at the position indicated by the red arrow. Move the brick smoothly from the callout to its destination, align it correctly, and snap it into place. \ No newline at end of file diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/final_frame.png b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..aa052adf5835c1f0e9c42f34e2f4b0f618edcbd0 Binary files /dev/null and b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/final_frame.png differ diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/first_frame.png b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5605d7e8f84950c6fcde6aedaa4026ab47cf5ef2 Binary files /dev/null and b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/first_frame.png differ diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/ground_truth.mp4 b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..19a68d705985de6da3b888fc13eac05014c0f81f --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1205ba39c0c7381c496542271d7d193614fce0f6cb5fe64a5d3591f3272265f +size 415342 diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/metadata.json b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..a922a178f102871bcb73acd3a91fef09540f79bd --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/metadata.json @@ -0,0 +1,158 @@ +{ + "task_id": "lego_construction_assembly_00000002", + "generator": "lego_construction_assembly", + "timestamp": "2026-02-17T07:45:08.192216", + "parameters": { + "step": 4, + "model_type": "wall", + "model_name": "L-Wall", + "new_brick_index": 4, + "objects": [ + { + "symbol": "brick", + "brick_type": "2x4", + "color": "red", + "position": [ + 0, + 0, + 0 + ], + "center_3d": [ + 1.0, + 2.0, + 1.5 + ], + "center_2d": [ + 638, + 727 + ], + "rotation": 0, + "size": [ + 2, + 4, + 3 + ], + "is_new": false, + "step_index": 0 + }, + { + "symbol": "brick", + "brick_type": "2x4", + "color": "red", + "position": [ + 0, + 4, + 0 + ], + "center_3d": [ + 1.0, + 6.0, + 1.5 + ], + "center_2d": [ + 465, + 827 + ], + "rotation": 0, + "size": [ + 2, + 4, + 3 + ], + "is_new": false, + "step_index": 1 + }, + { + "symbol": "brick", + "brick_type": "2x2", + "color": "red", + "position": [ + 0, + 8, + 0 + ], + "center_3d": [ + 1.0, + 9.0, + 1.5 + ], + "center_2d": [ + 335, + 902 + ], + "rotation": 0, + "size": [ + 2, + 2, + 3 + ], + "is_new": false, + "step_index": 2 + }, + { + "symbol": "brick", + "brick_type": "2x4", + "color": "blue", + "position": [ + 0, + 0, + 3 + ], + "center_3d": [ + 1.0, + 2.0, + 4.5 + ], + "center_2d": [ + 638, + 667 + ], + "rotation": 0, + "size": [ + 2, + 4, + 3 + ], + "is_new": false, + "step_index": 3 + }, + { + "symbol": "brick", + "brick_type": "2x4", + "color": "blue", + "position": [ + 0, + 4, + 3 + ], + "center_3d": [ + 1.0, + 6.0, + 4.5 + ], + "center_2d": [ + 465, + 767 + ], + "rotation": 0, + "size": [ + 2, + 4, + 3 + ], + "is_new": true, + "step_index": 4 + } + ] + }, + "param_hash": "abf2530148540850", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No 
newline at end of file diff --git a/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/prompt.txt b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e3e15da3892992cc5f3b044f4d03a2224bbd9e8 --- /dev/null +++ b/VBVR-Dataset/lego_construction_assembly_task/lego_construction_assembly_00000002/prompt.txt @@ -0,0 +1 @@ +This is LEGO assembly step 5. The scene shows a partial model on the right and a 2x4 blue brick on the left in a callout box. Take the blue brick and attach it to the model at the position indicated by the red arrow. Move the brick smoothly from the callout to its destination, align it correctly, and snap it into place. \ No newline at end of file diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000000/final_frame.png b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..59f3ed0bdede05d54c907a09abf6669cf4d624d7 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/final_frame.png differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000000/first_frame.png b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1742f6d7a3e8b87775c8ee3745f032f4811084f1 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/first_frame.png differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000000/ground_truth.mp4 b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f267a7bcd4fe527460151014c1729ca872689851 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/ground_truth.mp4 differ diff --git 
a/VBVR-Dataset/light_sequence_task/light_sequence_00000000/metadata.json b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3be61530ad7234eeb39f4ef7814bec7d15edb5bd --- /dev/null +++ b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/metadata.json @@ -0,0 +1,45 @@ +{ + "task_id": "light_sequence_00000000", + "generator": "light_sequence", + "timestamp": "2026-02-17T07:50:39.531019", + "parameters": { + "num_lights": 6, + "task_type": 6, + "color": [ + 220, + 53, + 69 + ], + "color_name": "red", + "initial_states": [ + 0, + 0, + 1, + 1, + 1, + 1 + ], + "final_states": [ + 0, + 0, + 0, + 0, + 0, + 1 + ], + "task_type_params": { + "count": 1, + "side": "right" + } + }, + "param_hash": "97fba2896541ad05", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000000/prompt.txt b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c73c3414b6030dfd6280137d8605ec43302dfd13 --- /dev/null +++ b/VBVR-Dataset/light_sequence_task/light_sequence_00000000/prompt.txt @@ -0,0 +1,3 @@ +The scene shows 6 circular lights in a horizontal row on a white background. Lights on are red with glow; lights off are gray. Initially, some lights are on and some are off. + +Your task: Modify the light states so that the rightmost 1 light (counting from left to right) is on (red with glow), and all other lights are off (gray). Turn lights on/off as needed. Lights change from gray to red (with glow) when turned on, and from red to gray (glow disappears) when turned off. Lights stay in fixed positions; only their states change. 
\ No newline at end of file diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000001/final_frame.png b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9459759b99e00aed9f78717d0a408d441d82ee70 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/final_frame.png differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000001/first_frame.png b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4eca163534fdb6390b8098c9b371b3f867ff4336 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/first_frame.png differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000001/ground_truth.mp4 b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..478d74f0b6ff21814c0db8eb7dc1014562eee89b Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000001/metadata.json b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..89f1fa87db1af26f24caefc17969278537b0067f --- /dev/null +++ b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/metadata.json @@ -0,0 +1,50 @@ +{ + "task_id": "light_sequence_00000001", + "generator": "light_sequence", + "timestamp": "2026-02-17T07:50:46.931376", + "parameters": { + "num_lights": 8, + "task_type": 1, + "color": [ + 255, + 215, + 0 + ], + "color_name": "gold", + "initial_states": [ + 1, + 1, + 0, + 1, + 0, + 0, + 0, + 0 + ], + "final_states": [ + 0, + 1, + 0, + 0, + 0, + 0, + 0, + 0 + ], + "task_type_params": { + "positions": [ + 2 + ] + } + }, + "param_hash": 
"d0d1234098ca63d3", + "generation": { + "seed": 1901164218, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000001/prompt.txt b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..1af6e39ef90df401c2cabed98c7904223b0209db --- /dev/null +++ b/VBVR-Dataset/light_sequence_task/light_sequence_00000001/prompt.txt @@ -0,0 +1,3 @@ +The scene shows 8 circular lights in a horizontal row on a white background. Lights on are gold/yellow with glow; lights off are gray. Initially, some lights are on and some are off. + +Your task: Modify the light states so that the 2nd light from the left (counting from left to right) is on (gold/yellow with glow), and all other lights are off (gray). Turn lights on/off as needed. Lights change from gray to gold/yellow (with glow) when turned on, and from gold/yellow to gray (glow disappears) when turned off. Lights stay in fixed positions; only their states change. 
\ No newline at end of file diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000002/final_frame.png b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6f2725a3d78f2bd90c6cae5628db4bb67e3ea2f6 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/final_frame.png differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000002/first_frame.png b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6f2725a3d78f2bd90c6cae5628db4bb67e3ea2f6 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/first_frame.png differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000002/ground_truth.mp4 b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3399b04424a8f906243f8f5236cda8cd5558aa91 Binary files /dev/null and b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000002/metadata.json b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fec842214a7eaf50e4ad9eab4dcc2c3fb7c9b67f --- /dev/null +++ b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/metadata.json @@ -0,0 +1,40 @@ +{ + "task_id": "light_sequence_00000002", + "generator": "light_sequence", + "timestamp": "2026-02-17T07:50:40.648262", + "parameters": { + "num_lights": 4, + "task_type": 4, + "color": [ + 255, + 192, + 203 + ], + "color_name": "pink", + "initial_states": [ + 0, + 0, + 1, + 1 + ], + "final_states": [ + 0, + 0, + 1, + 1 + ], + "task_type_params": { + "range": "right" + } + }, + "param_hash": "295e3be86de70568", + "generation": { + "seed": 
1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/light_sequence_task/light_sequence_00000002/prompt.txt b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d7b1165f33e14609f79430ba3b702beac736c595 --- /dev/null +++ b/VBVR-Dataset/light_sequence_task/light_sequence_00000002/prompt.txt @@ -0,0 +1,3 @@ +The scene shows 4 circular lights in a horizontal row on a white background. Lights on are pink with glow; lights off are gray. Initially, some lights are on and some are off. + +Your task: Modify the light states so that all lights in the right half of the row (the 2 lights from the right side, counting from left to right) are on (pink with glow), and all lights in the left half are off (gray). Turn lights on/off as needed. Lights change from gray to pink (with glow) when turned on, and from pink to gray (glow disappears) when turned off. Lights stay in fixed positions; only their states change. 
\ No newline at end of file diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/final_frame.png b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fc045f9f267ed7b074bc3b4b11bc2c16787da4ee Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/final_frame.png differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/first_frame.png b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bb57bf92861706dd73ce968155c19e53c03ab69f Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/first_frame.png differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/ground_truth.mp4 b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e33ad22351fb2cf8cc428a7b18102f301a527973 Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/metadata.json b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..887bfd78135a7576ff801b140210d287d6fb1e53 --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/metadata.json @@ -0,0 +1,97 @@ +{ + "task_id": "locate_line_intersections_00000000", + "generator": "locate_line_intersections", + "timestamp": "2026-02-17T07:06:55.699463", + "parameters": { + "lines": [ + { + "start": 
[ + 168, + 109 + ], + "end": [ + 568, + 641 + ], + "color": [ + 166, + 108, + 126 + ], + "thickness": 6 + }, + { + "start": [ + 419, + 150 + ], + "end": [ + 851, + 570 + ], + "color": [ + 149, + 150, + 134 + ], + "thickness": 4 + }, + { + "start": [ + 726, + 140 + ], + "end": [ + 299, + 590 + ], + "color": [ + 86, + 73, + 83 + ], + "thickness": 4 + }, + { + "start": [ + 154, + 393 + ], + "end": [ + 639, + 836 + ], + "color": [ + 138, + 152, + 144 + ], + "thickness": 5 + } + ], + "intersections": [ + [ + 427, + 454 + ], + [ + 573, + 300 + ], + [ + 331, + 555 + ] + ] + }, + "param_hash": "d65feda46e063c1d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/prompt.txt b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d287269558bd64ca965e72a669ee7837d6d631c --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000000/prompt.txt @@ -0,0 +1 @@ +Circle all intersection points of the line segments with red circles. 
\ No newline at end of file diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/final_frame.png b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a10515507b438d74911567278a80c9e08b6da40a Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/final_frame.png differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/first_frame.png b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9835c16136514591ac9acaa7b791e3001445a3ba Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/first_frame.png differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/ground_truth.mp4 b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..fe31f795c6f5be3338be1c7faca84f4109703f7c Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/metadata.json b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4b86297e48d94a2421fd5c24f9790342a0291e42 --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/metadata.json @@ -0,0 +1,109 @@ +{ + "task_id": "locate_line_intersections_00000001", + "generator": "locate_line_intersections", + "timestamp": "2026-02-17T07:06:55.899396", + "parameters": { + "lines": [ + { + "start": 
[ + 190, + 143 + ], + "end": [ + 615, + 583 + ], + "color": [ + 169, + 132, + 70 + ], + "thickness": 7 + }, + { + "start": [ + 445, + 189 + ], + "end": [ + 835, + 599 + ], + "color": [ + 112, + 108, + 127 + ], + "thickness": 6 + }, + { + "start": [ + 720, + 137 + ], + "end": [ + 329, + 587 + ], + "color": [ + 134, + 147, + 86 + ], + "thickness": 7 + }, + { + "start": [ + 119, + 396 + ], + "end": [ + 608, + 874 + ], + "color": [ + 96, + 127, + 148 + ], + "thickness": 5 + }, + { + "start": [ + 465, + 460 + ], + "end": [ + 855, + 905 + ], + "color": [ + 152, + 124, + 131 + ], + "thickness": 5 + } + ], + "intersections": [ + [ + 466, + 429 + ], + [ + 565, + 315 + ] + ] + }, + "param_hash": "1e435b9e5fca8407", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/prompt.txt b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d287269558bd64ca965e72a669ee7837d6d631c --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000001/prompt.txt @@ -0,0 +1 @@ +Circle all intersection points of the line segments with red circles. 
\ No newline at end of file diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/final_frame.png b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d86c7d2fa1da5cce9c54980f5709ce9b9ce54262 Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/final_frame.png differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/first_frame.png b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ffe870a983a3ee61e93e830b32a610e58053eef2 Binary files /dev/null and b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/first_frame.png differ diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/ground_truth.mp4 b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..83cf956c9678d591c1587b11842605e6a4e78328 --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7e598f696fc8546eb7e6a78999f53798cc806e62e6d3eb3949b3753cca4b46 +size 117181 diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/metadata.json b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..562a9a7a0f129fd2ef19c494c2dc38550c4bf365 --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/metadata.json @@ -0,0 +1,145 @@ +{ + "task_id": "locate_line_intersections_00000002", 
+ "generator": "locate_line_intersections", + "timestamp": "2026-02-17T07:06:56.145795", + "parameters": { + "lines": [ + { + "start": [ + 155, + 190 + ], + "end": [ + 594, + 614 + ], + "color": [ + 115, + 103, + 144 + ], + "thickness": 6 + }, + { + "start": [ + 458, + 168 + ], + "end": [ + 907, + 629 + ], + "color": [ + 170, + 115, + 126 + ], + "thickness": 4 + }, + { + "start": [ + 697, + 158 + ], + "end": [ + 355, + 612 + ], + "color": [ + 95, + 98, + 84 + ], + "thickness": 6 + }, + { + "start": [ + 163, + 406 + ], + "end": [ + 610, + 869 + ], + "color": [ + 75, + 139, + 114 + ], + "thickness": 5 + }, + { + "start": [ + 413, + 376 + ], + "end": [ + 893, + 836 + ], + "color": [ + 129, + 162, + 102 + ], + "thickness": 5 + }, + { + "start": [ + 656, + 434 + ], + "end": [ + 348, + 843 + ], + "color": [ + 167, + 84, + 160 + ], + "thickness": 7 + } + ], + "intersections": [ + [ + 454, + 479 + ], + [ + 551, + 572 + ], + [ + 588, + 302 + ], + [ + 358, + 607 + ], + [ + 482, + 442 + ], + [ + 451, + 705 + ], + [ + 579, + 535 + ] + ] + }, + "param_hash": "a4351c907b03f695", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/prompt.txt b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9d287269558bd64ca965e72a669ee7837d6d631c --- /dev/null +++ b/VBVR-Dataset/locate_line_intersections_task/locate_line_intersections_00000002/prompt.txt @@ -0,0 +1 @@ +Circle all intersection points of the line segments with red circles. 
\ No newline at end of file diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/final_frame.png b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7209c4971d9db97e25816f45808147059edd0d71 Binary files /dev/null and b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/final_frame.png differ diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/first_frame.png b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..02f9f63b78fd47286e81f094fea8205f8ab60576 Binary files /dev/null and b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/first_frame.png differ diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/ground_truth.mp4 b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..734688b001bdb8f2040aefceefa1344351e30e9f --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:613832b5cb82a65f6e12468a98c4de23a058bace20910324d121bfc0c25756a1 +size 335845 diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/metadata.json b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1dd87c08c329f75df4fa51353958cef750021401 --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/metadata.json 
@@ -0,0 +1,44 @@ +{ + "task_id": "locate_twelve_o_clock_arrows_00000000", + "generator": "locate_twelve_o_clock_arrows", + "timestamp": "2026-02-17T06:58:20.948532", + "parameters": { + "clocks": [ + { + "center": [ + 749.0, + 298.0 + ], + "radius": 180.0, + "hour_angle": 62.298199 + }, + { + "center": [ + 373.0, + 603.0 + ], + "radius": 180.0, + "hour_angle": 0.0 + }, + { + "center": [ + 749.0, + 797.0 + ], + "radius": 180.0, + "hour_angle": 178.641672 + } + ], + "target_index": 1 + }, + "param_hash": "2dcfa44c1e6a0710", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/prompt.txt b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6feb7499b0770b5a62a4e8ede0d1eed49c7aed33 --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000000/prompt.txt @@ -0,0 +1 @@ +The image contains 3 clocks, each with only an hour hand. Exactly one clock has its hour hand pointing to 12 o'clock. First find the single clock pointing to 12 o'clock, then draw a red circle around it. Do not change anything else. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/final_frame.png b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..520ad5232e04e1df34827333d921f4a4b462fb6a Binary files /dev/null and b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/final_frame.png differ diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/first_frame.png b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a3a82485fb3a412170407e2ee079a316064ea6f6 Binary files /dev/null and b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/first_frame.png differ diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/ground_truth.mp4 b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..eb5ddb936a8a158f06da976c6f1070ade0976ced --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3751839070f7995c335d23e509065275c52ef0459a15808ce758bb8fd99b4a6 +size 347675 diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/metadata.json b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..201599c06e2afe751706b81dd64307cb9b1b6307 --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/metadata.json 
@@ -0,0 +1,44 @@ +{ + "task_id": "locate_twelve_o_clock_arrows_00000001", + "generator": "locate_twelve_o_clock_arrows", + "timestamp": "2026-02-17T06:58:21.341530", + "parameters": { + "clocks": [ + { + "center": [ + 557.0, + 273.0 + ], + "radius": 180.0, + "hour_angle": 325.023781 + }, + { + "center": [ + 538.0, + 737.0 + ], + "radius": 180.0, + "hour_angle": 0.0 + }, + { + "center": [ + 227.0, + 495.0 + ], + "radius": 180.0, + "hour_angle": 113.867882 + } + ], + "target_index": 1 + }, + "param_hash": "597900d53e2195e8", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/prompt.txt b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6feb7499b0770b5a62a4e8ede0d1eed49c7aed33 --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000001/prompt.txt @@ -0,0 +1 @@ +The image contains 3 clocks, each with only an hour hand. Exactly one clock has its hour hand pointing to 12 o'clock. First find the single clock pointing to 12 o'clock, then draw a red circle around it. Do not change anything else. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/final_frame.png b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..07bdb56d842abd5b5dceee94c57d3c1f4ba2daaf Binary files /dev/null and b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/final_frame.png differ diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/first_frame.png b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..96baa3bb043143d028d83e6b12060cfa4a4338e1 Binary files /dev/null and b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/first_frame.png differ diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/ground_truth.mp4 b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..92525e8d0d7f03644ea5989c6613e88f594343eb --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248813d2d4cfe2ec0b0b972e89f1e9587d917a8cf42add027a6ed5e7ab2cea62 +size 307881 diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/metadata.json b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6ecfd9e73ff7fb18a52ec9c469ba1f35d77252f4 --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/metadata.json 
@@ -0,0 +1,36 @@ +{ + "task_id": "locate_twelve_o_clock_arrows_00000002", + "generator": "locate_twelve_o_clock_arrows", + "timestamp": "2026-02-17T06:58:21.738576", + "parameters": { + "clocks": [ + { + "center": [ + 572.0, + 392.0 + ], + "radius": 180.0, + "hour_angle": 184.37427 + }, + { + "center": [ + 201.0, + 524.0 + ], + "radius": 180.0, + "hour_angle": 0.0 + } + ], + "target_index": 1 + }, + "param_hash": "1f32bb83cf9ae993", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/prompt.txt b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..01bb0934c66da3134519a24e09ce94cae1827a9f --- /dev/null +++ b/VBVR-Dataset/locate_twelve_o_clock_arrows_task/locate_twelve_o_clock_arrows_00000002/prompt.txt @@ -0,0 +1 @@ +The image contains 2 clocks, each with only an hour hand. Exactly one clock has its hour hand pointing to 12 o'clock. First find the single clock pointing to 12 o'clock, then draw a red circle around it. Do not change anything else. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/final_frame.png b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6cc7f9d7bef62f47486875c287ec911df63dbab0 Binary files /dev/null and b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/final_frame.png differ diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/first_frame.png b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d505f30d2f37b406f75415cf96a3d390a9c2168b Binary files /dev/null and b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/first_frame.png differ diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/ground_truth.mp4 b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..ba86132177c6278337addc5e97914019305ef40c --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6dccb1111068b0d01f0e2eb7b6068e30fe91d999e5f45e938fb0ddc3d9f82e +size 176978 diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/metadata.json 
b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..944bb469c3f2664f654b710c0630d0bd5ed418ab --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "maintain_object_identity_different_objects_00000000", + "generator": "maintain_object_identity_different_objects", + "timestamp": "2026-02-17T07:18:16.667896", + "parameters": { + "object1": { + "original_position": "left", + "color": [ + 220, + 192, + 215 + ], + "size": 72, + "shape": "square" + }, + "object2": { + "original_position": "right", + "color": [ + 134, + 242, + 127 + ], + "size": 69, + "shape": "hexagon" + }, + "arrow": "original_right" + }, + "param_hash": "a12e3736fc44f690", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/prompt.txt b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..f750de7584648b49b4f30d8b45911ddc8f67b421 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000000/prompt.txt @@ -0,0 +1 @@ +The left object is white and the right object is green. The scene shows two objects, one on the left and one on the right. Swap the positions of the left and right objects. After the swap, draw an arrow below the object that was originally on the right, pointing up at it. 
\ No newline at end of file diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/final_frame.png b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3c331a3021496f241f6216c831903a7df8844f36 Binary files /dev/null and b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/final_frame.png differ diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/first_frame.png b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c3239bb57a81244df6850e2ed65cebd518d1bfae Binary files /dev/null and b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/first_frame.png differ diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/ground_truth.mp4 b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b2ca0b16abf414bd6d41b0771937f2c387ee8287 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c24ef0bee7504b77d09a3fa7e6ca89ffde9c200edfbe06eed684af6f71d2d84 +size 152825 diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/metadata.json 
b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3bd5ee115915b1b2c9e076e064c437dd1ee9db40 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "maintain_object_identity_different_objects_00000001", + "generator": "maintain_object_identity_different_objects", + "timestamp": "2026-02-17T07:18:17.466898", + "parameters": { + "object1": { + "original_position": "left", + "color": [ + 213, + 79, + 209 + ], + "size": 110, + "shape": "triangle" + }, + "object2": { + "original_position": "right", + "color": [ + 210, + 178, + 207 + ], + "size": 74, + "shape": "square" + }, + "arrow": "original_left" + }, + "param_hash": "d94733e16b165998", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/prompt.txt b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e22163534657c9eddc7a2b57364dca2f73229291 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000001/prompt.txt @@ -0,0 +1 @@ +The left object is red and the right object is orange. The scene shows two objects, one on the left and one on the right. Swap the positions of the left and right objects. After the swap, draw an arrow below the object that was originally on the left, pointing up at it. 
\ No newline at end of file diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/final_frame.png b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..24074fed425d02d39588dd85c7a3f73638078bc8 Binary files /dev/null and b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/final_frame.png differ diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/first_frame.png b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bf96fcf306e7763c56fb7782f992dc87871e6cb2 Binary files /dev/null and b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/first_frame.png differ diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/ground_truth.mp4 b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4d0f24041f7b7f7d89d707aa4a3fa39e8c47fd39 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae2d12e894d07ae25c0ceebba3d434586e62ccd4a4d627c3e0cfcbeca80ce9d +size 212043 diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/metadata.json 
b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..82022477803caa4155d5aca80325b51c4bc5a3f7 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/metadata.json @@ -0,0 +1,38 @@ +{ + "task_id": "maintain_object_identity_different_objects_00000002", + "generator": "maintain_object_identity_different_objects", + "timestamp": "2026-02-17T07:18:18.216647", + "parameters": { + "object1": { + "original_position": "left", + "color": [ + 83, + 56, + 76 + ], + "size": 137, + "shape": "triangle" + }, + "object2": { + "original_position": "right", + "color": [ + 159, + 217, + 88 + ], + "size": 60, + "shape": "pentagon" + }, + "arrow": "original_left" + }, + "param_hash": "6faac6936a0c1342", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/prompt.txt b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..12e1ae2de8087f38ae9cf48cfb16964a77934fb0 --- /dev/null +++ b/VBVR-Dataset/maintain_object_identity_different_objects_task/maintain_object_identity_different_objects_00000002/prompt.txt @@ -0,0 +1 @@ +The left object is gray and the right object is green. The scene shows two objects, one on the left and one on the right. Swap the positions of the left and right objects. After the swap, draw an arrow below the object that was originally on the left, pointing up at it. 
\ No newline at end of file diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000000/final_frame.png b/VBVR-Dataset/majority_color_task/majority_color_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f62c802673046704b3bf3823b95e979a9792a552 Binary files /dev/null and b/VBVR-Dataset/majority_color_task/majority_color_00000000/final_frame.png differ diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000000/first_frame.png b/VBVR-Dataset/majority_color_task/majority_color_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a372e65cd3547f70c6617f8564225d37d9e7c698 Binary files /dev/null and b/VBVR-Dataset/majority_color_task/majority_color_00000000/first_frame.png differ diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000000/ground_truth.mp4 b/VBVR-Dataset/majority_color_task/majority_color_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5c5243df0fdab7cf1f8ab661abc711c39447fde6 --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d57d9116b5afe90ad11885d1a97362911a5bf2660564bfb63a90811856161157 +size 214161 diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000000/metadata.json b/VBVR-Dataset/majority_color_task/majority_color_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..40213d2df5e69ddd5e70dacbf57a40dfe7aa2a55 --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000000/metadata.json @@ -0,0 +1,281 @@ +{ + "task_id": "majority_color_00000000", + "generator": "majority_color", + "timestamp": "2026-02-17T07:50:29.216346", + "parameters": { + "majority_color": [ + 255, + 0, + 0 + ], + "majority_color_name": "red", + "majority_count": 8, + "objects": [ + { + "symbol": "shape", + "index": 0, + "type": "triangle", + 
"color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 82, + 306 + ], + "size": 83, + "is_majority": true + }, + { + "symbol": "shape", + "index": 1, + "type": "rectangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 918, + 872 + ], + "size": 102, + "is_majority": false + }, + { + "symbol": "shape", + "index": 2, + "type": "circle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 106, + 389 + ], + "size": 41, + "is_majority": false + }, + { + "symbol": "shape", + "index": 3, + "type": "rectangle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 182, + 427 + ], + "size": 99, + "is_majority": true + }, + { + "symbol": "shape", + "index": 4, + "type": "rectangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 139, + 772 + ], + "size": 68, + "is_majority": false + }, + { + "symbol": "shape", + "index": 5, + "type": "ellipse", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 851, + 744 + ], + "size": 75, + "is_majority": true + }, + { + "symbol": "shape", + "index": 6, + "type": "circle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 826, + 313 + ], + "size": 92, + "is_majority": true + }, + { + "symbol": "shape", + "index": 7, + "type": "ellipse", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 428, + 690 + ], + "size": 49, + "is_majority": true + }, + { + "symbol": "shape", + "index": 8, + "type": "rectangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 422, + 167 + ], + "size": 77, + "is_majority": false + }, + { + "symbol": "shape", + "index": 9, + "type": "triangle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 311, + 179 + ], + "size": 77, + "is_majority": true + }, + { + "symbol": "shape", + "index": 10, + "type": "circle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 536, + 633 
+ ], + "size": 84, + "is_majority": true + }, + { + "symbol": "shape", + "index": 11, + "type": "triangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 927, + 849 + ], + "size": 101, + "is_majority": false + }, + { + "symbol": "shape", + "index": 12, + "type": "triangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 705, + 573 + ], + "size": 64, + "is_majority": false + }, + { + "symbol": "shape", + "index": 13, + "type": "ellipse", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 734, + 964 + ], + "size": 67, + "is_majority": true + }, + { + "symbol": "shape", + "index": 14, + "type": "circle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 300, + 325 + ], + "size": 97, + "is_majority": false + } + ] + }, + "param_hash": "e312ffdc6e54eada", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000000/prompt.txt b/VBVR-Dataset/majority_color_task/majority_color_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..64836033b97ab58a0dc085dedd12bfbd5ef2aa1d --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000000/prompt.txt @@ -0,0 +1 @@ +The image shows multiple colored objects. Count how many objects are of each color. Identify the majority color (the color with the most objects). Then make all objects of other colors vanish, while the majority color objects remain stationary. 
\ No newline at end of file diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000001/final_frame.png b/VBVR-Dataset/majority_color_task/majority_color_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5773b823cb5395e04a4f1d83a815918900d538b3 Binary files /dev/null and b/VBVR-Dataset/majority_color_task/majority_color_00000001/final_frame.png differ diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000001/first_frame.png b/VBVR-Dataset/majority_color_task/majority_color_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2e2f13d385bece9524314fc057148ca031c9103c Binary files /dev/null and b/VBVR-Dataset/majority_color_task/majority_color_00000001/first_frame.png differ diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000001/ground_truth.mp4 b/VBVR-Dataset/majority_color_task/majority_color_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5b1ae07de4321b8613188ce97ed63009fa4b7075 --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088816af436034e1a7a77629ca497eb775a08cf8f34592bcad047f83bbd34c51 +size 175959 diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000001/metadata.json b/VBVR-Dataset/majority_color_task/majority_color_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..297a8152ce34b0181e60fd831b8c71bdfcb30af5 --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000001/metadata.json @@ -0,0 +1,281 @@ +{ + "task_id": "majority_color_00000001", + "generator": "majority_color", + "timestamp": "2026-02-17T07:50:29.815188", + "parameters": { + "majority_color": [ + 0, + 255, + 0 + ], + "majority_color_name": "green", + "majority_count": 9, + "objects": [ + { + "symbol": "shape", + "index": 0, + "type": "triangle", + 
"color": [ + 255, + 255, + 0 + ], + "color_name": "yellow", + "center": [ + 424, + 382 + ], + "size": 42, + "is_majority": false + }, + { + "symbol": "shape", + "index": 1, + "type": "circle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 910, + 994 + ], + "size": 55, + "is_majority": false + }, + { + "symbol": "shape", + "index": 2, + "type": "triangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 176, + 162 + ], + "size": 58, + "is_majority": true + }, + { + "symbol": "shape", + "index": 3, + "type": "triangle", + "color": [ + 255, + 255, + 0 + ], + "color_name": "yellow", + "center": [ + 418, + 276 + ], + "size": 101, + "is_majority": false + }, + { + "symbol": "shape", + "index": 4, + "type": "triangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 757, + 648 + ], + "size": 43, + "is_majority": true + }, + { + "symbol": "shape", + "index": 5, + "type": "triangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 590, + 460 + ], + "size": 81, + "is_majority": true + }, + { + "symbol": "shape", + "index": 6, + "type": "ellipse", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 252, + 472 + ], + "size": 37, + "is_majority": true + }, + { + "symbol": "shape", + "index": 7, + "type": "circle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 934, + 344 + ], + "size": 52, + "is_majority": true + }, + { + "symbol": "shape", + "index": 8, + "type": "triangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 118, + 761 + ], + "size": 73, + "is_majority": true + }, + { + "symbol": "shape", + "index": 9, + "type": "rectangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 514, + 94 + ], + "size": 31, + "is_majority": false + }, + { + "symbol": "shape", + "index": 10, + "type": "rectangle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + 
"center": [ + 134, + 469 + ], + "size": 98, + "is_majority": true + }, + { + "symbol": "shape", + "index": 11, + "type": "ellipse", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 62, + 455 + ], + "size": 62, + "is_majority": true + }, + { + "symbol": "shape", + "index": 12, + "type": "ellipse", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 173, + 438 + ], + "size": 50, + "is_majority": false + }, + { + "symbol": "shape", + "index": 13, + "type": "triangle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 735, + 870 + ], + "size": 62, + "is_majority": false + }, + { + "symbol": "shape", + "index": 14, + "type": "circle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 290, + 65 + ], + "size": 60, + "is_majority": true + } + ] + }, + "param_hash": "46d1c472bb84b4ef", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000001/prompt.txt b/VBVR-Dataset/majority_color_task/majority_color_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..64836033b97ab58a0dc085dedd12bfbd5ef2aa1d --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000001/prompt.txt @@ -0,0 +1 @@ +The image shows multiple colored objects. Count how many objects are of each color. Identify the majority color (the color with the most objects). Then make all objects of other colors vanish, while the majority color objects remain stationary. 
\ No newline at end of file diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000002/final_frame.png b/VBVR-Dataset/majority_color_task/majority_color_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9f7df4ad5675c9fc2a0cc5f44f366a1d12487a2a Binary files /dev/null and b/VBVR-Dataset/majority_color_task/majority_color_00000002/final_frame.png differ diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000002/first_frame.png b/VBVR-Dataset/majority_color_task/majority_color_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a3ed6040ecb93c4231fbfb8b9105ad36bb1117fa Binary files /dev/null and b/VBVR-Dataset/majority_color_task/majority_color_00000002/first_frame.png differ diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000002/ground_truth.mp4 b/VBVR-Dataset/majority_color_task/majority_color_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..9ffc00e63c58ebfaba749b8f7b494c2e7fa88db0 --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c33c76a067c38b96d5464d84b793f97b7cee0c3f2b01fdd65d1a38b4e62eea +size 179125 diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000002/metadata.json b/VBVR-Dataset/majority_color_task/majority_color_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..23ac69cd70b1b4b2cf24aff713a977666c8a1789 --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000002/metadata.json @@ -0,0 +1,281 @@ +{ + "task_id": "majority_color_00000002", + "generator": "majority_color", + "timestamp": "2026-02-17T07:50:30.412059", + "parameters": { + "majority_color": [ + 0, + 0, + 255 + ], + "majority_color_name": "blue", + "majority_count": 10, + "objects": [ + { + "symbol": "shape", + "index": 0, + "type": "triangle", + 
"color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 987, + 804 + ], + "size": 36, + "is_majority": true + }, + { + "symbol": "shape", + "index": 1, + "type": "circle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 860, + 91 + ], + "size": 76, + "is_majority": true + }, + { + "symbol": "shape", + "index": 2, + "type": "circle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 378, + 843 + ], + "size": 94, + "is_majority": true + }, + { + "symbol": "shape", + "index": 3, + "type": "circle", + "color": [ + 0, + 255, + 0 + ], + "color_name": "green", + "center": [ + 759, + 276 + ], + "size": 101, + "is_majority": false + }, + { + "symbol": "shape", + "index": 4, + "type": "circle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 992, + 407 + ], + "size": 56, + "is_majority": false + }, + { + "symbol": "shape", + "index": 5, + "type": "triangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 93, + 513 + ], + "size": 31, + "is_majority": true + }, + { + "symbol": "shape", + "index": 6, + "type": "triangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 683, + 951 + ], + "size": 39, + "is_majority": true + }, + { + "symbol": "shape", + "index": 7, + "type": "rectangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 943, + 447 + ], + "size": 38, + "is_majority": true + }, + { + "symbol": "shape", + "index": 8, + "type": "rectangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 944, + 443 + ], + "size": 99, + "is_majority": true + }, + { + "symbol": "shape", + "index": 9, + "type": "ellipse", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 448, + 81 + ], + "size": 50, + "is_majority": true + }, + { + "symbol": "shape", + "index": 10, + "type": "rectangle", + "color": [ + 255, + 0, + 0 + ], + "color_name": "red", + "center": [ + 510, + 280 + 
], + "size": 92, + "is_majority": false + }, + { + "symbol": "shape", + "index": 11, + "type": "rectangle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 205, + 337 + ], + "size": 69, + "is_majority": true + }, + { + "symbol": "shape", + "index": 12, + "type": "circle", + "color": [ + 0, + 0, + 255 + ], + "color_name": "blue", + "center": [ + 418, + 244 + ], + "size": 90, + "is_majority": true + }, + { + "symbol": "shape", + "index": 13, + "type": "triangle", + "color": [ + 255, + 0, + 255 + ], + "color_name": "magenta", + "center": [ + 895, + 429 + ], + "size": 36, + "is_majority": false + }, + { + "symbol": "shape", + "index": 14, + "type": "ellipse", + "color": [ + 255, + 255, + 0 + ], + "color_name": "yellow", + "center": [ + 460, + 245 + ], + "size": 104, + "is_majority": false + } + ] + }, + "param_hash": "a46ff06960c259f7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/majority_color_task/majority_color_00000002/prompt.txt b/VBVR-Dataset/majority_color_task/majority_color_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..64836033b97ab58a0dc085dedd12bfbd5ef2aa1d --- /dev/null +++ b/VBVR-Dataset/majority_color_task/majority_color_00000002/prompt.txt @@ -0,0 +1 @@ +The image shows multiple colored objects. Count how many objects are of each color. Identify the majority color (the color with the most objects). Then make all objects of other colors vanish, while the majority color objects remain stationary. 
\ No newline at end of file diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/final_frame.png b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3ca6192b6a8c9f5c5c979d40895f5013fa0adefe Binary files /dev/null and b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/final_frame.png differ diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/first_frame.png b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fbe62683db4415b8df53488876ce57f1a0db2921 Binary files /dev/null and b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/first_frame.png differ diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/ground_truth.mp4 b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e05fed2ef7ef9b63499d5b4117b49c832b20ec2f --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f657dd7b10bceabe4752f3d875373f838ae0e2143f42eaeb7d93b000e84d2d3 +size 272534 diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/metadata.json b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f68b2328ba3ebb98c66a0907ff91f8b1ee6c5610 --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/metadata.json @@ -0,0 +1,150 @@ +{ + 
"task_id": "mark_right_angled_triangles_00000000", + "generator": "mark_right_angled_triangles", + "timestamp": "2026-02-17T07:06:21.281374", + "parameters": { + "triangles": [ + { + "vertices": [ + [ + 346, + 323 + ], + [ + 346, + 434 + ], + [ + 428, + 323 + ] + ], + "color": [ + 140, + 93, + 150 + ] + }, + { + "vertices": [ + [ + 660, + 720 + ], + [ + 726, + 720 + ], + [ + 660, + 636 + ] + ], + "color": [ + 170, + 117, + 55 + ] + }, + { + "vertices": [ + [ + 423, + 610 + ], + [ + 423, + 692 + ], + [ + 530, + 610 + ] + ], + "color": [ + 145, + 162, + 198 + ] + }, + { + "vertices": [ + [ + 870, + 275 + ], + [ + 620, + 446 + ], + [ + 809, + 333 + ] + ], + "color": [ + 181, + 121, + 132 + ] + }, + { + "vertices": [ + [ + 845, + 436 + ], + [ + 724, + 439 + ], + [ + 842, + 485 + ] + ], + "color": [ + 94, + 178, + 58 + ] + }, + { + "vertices": [ + [ + 600, + 422 + ], + [ + 834, + 185 + ], + [ + 652, + 233 + ] + ], + "color": [ + 112, + 148, + 61 + ] + } + ], + "right_angled_indices": [ + 0, + 1, + 2 + ] + }, + "param_hash": "92a4522b65ae0a4b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/prompt.txt b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..86d0acc884f63e6db42b3c518ed35bcb5a60a0f4 --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows multiple triangles on a white background. Identify every triangle that has a right angle (90°) and mark each one with a red circle; each circle must enclose only that right-angled triangle, not any other shape. Show the solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/final_frame.png b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..92b22281c0caa21f73abc8775b7fcd2a52616eba Binary files /dev/null and b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/final_frame.png differ diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/first_frame.png b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..58dbbbb6186ab3a95878ca3143f0dccce6207573 Binary files /dev/null and b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/first_frame.png differ diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/ground_truth.mp4 b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b46f1bd6dba33eaa0c60c59d7256f89c2b0f10bc --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c202a5865b29f724a43d3a1fa0c192d67a942edcb169e95036c5217300668286 +size 318393 diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/metadata.json b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9cbbf3773d67b545f68c6fc828b0c6929ce29384 --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/metadata.json @@ -0,0 +1,190 @@ +{ + 
"task_id": "mark_right_angled_triangles_00000001", + "generator": "mark_right_angled_triangles", + "timestamp": "2026-02-17T07:06:22.012553", + "parameters": { + "triangles": [ + { + "vertices": [ + [ + 678, + 434 + ], + [ + 678, + 393 + ], + [ + 593, + 434 + ] + ], + "color": [ + 182, + 170, + 114 + ] + }, + { + "vertices": [ + [ + 857, + 882 + ], + [ + 763, + 296 + ], + [ + 845, + 322 + ] + ], + "color": [ + 131, + 67, + 137 + ] + }, + { + "vertices": [ + [ + 286, + 406 + ], + [ + 256, + 382 + ], + [ + 228, + 713 + ] + ], + "color": [ + 93, + 68, + 90 + ] + }, + { + "vertices": [ + [ + 518, + 437 + ], + [ + 382, + 288 + ], + [ + 462, + 811 + ] + ], + "color": [ + 88, + 93, + 85 + ] + }, + { + "vertices": [ + [ + 617, + 547 + ], + [ + 465, + 842 + ], + [ + 613, + 668 + ] + ], + "color": [ + 192, + 117, + 120 + ] + }, + { + "vertices": [ + [ + 272, + 186 + ], + [ + 157, + 313 + ], + [ + 377, + 287 + ] + ], + "color": [ + 99, + 121, + 191 + ] + }, + { + "vertices": [ + [ + 824, + 828 + ], + [ + 528, + 844 + ], + [ + 476, + 885 + ] + ], + "color": [ + 183, + 55, + 121 + ] + }, + { + "vertices": [ + [ + 760, + 177 + ], + [ + 252, + 173 + ], + [ + 628, + 212 + ] + ], + "color": [ + 87, + 162, + 69 + ] + } + ], + "right_angled_indices": [ + 0 + ] + }, + "param_hash": "134b46c3fa56a1ed", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/prompt.txt b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..86d0acc884f63e6db42b3c518ed35bcb5a60a0f4 --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows multiple triangles on a white background. 
Identify every triangle that has a right angle (90°) and mark each one with a red circle; each circle must enclose only that right-angled triangle, not any other shape. Show the solution step by step. \ No newline at end of file diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/final_frame.png b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f217ba100e66d1eade12edb9a9fd3a67d6402a7d Binary files /dev/null and b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/final_frame.png differ diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/first_frame.png b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4fda70692a2e0270d535e7229259064fb15b91e0 Binary files /dev/null and b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/first_frame.png differ diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/ground_truth.mp4 b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3b5dbe0f2af0ed31f72d30fbe99ed97636b0eb4c --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c5b36101148b92be64699a9ca056b499796b3fb70a18ec01851ed326b1d0e7 +size 307351 diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/metadata.json b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..fccb25ba5dd5288c1949cf23e8da2dac8ba8d5b2 --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/metadata.json @@ -0,0 +1,191 @@ +{ + "task_id": "mark_right_angled_triangles_00000002", + "generator": "mark_right_angled_triangles", + "timestamp": "2026-02-17T07:06:22.727063", + "parameters": { + "triangles": [ + { + "vertices": [ + [ + 596, + 456 + ], + [ + 596, + 336 + ], + [ + 540, + 456 + ] + ], + "color": [ + 138, + 68, + 56 + ] + }, + { + "vertices": [ + [ + 344, + 423 + ], + [ + 344, + 372 + ], + [ + 384, + 423 + ] + ], + "color": [ + 109, + 183, + 81 + ] + }, + { + "vertices": [ + [ + 586, + 835 + ], + [ + 286, + 837 + ], + [ + 212, + 634 + ] + ], + "color": [ + 113, + 77, + 179 + ] + }, + { + "vertices": [ + [ + 146, + 229 + ], + [ + 144, + 602 + ], + [ + 183, + 317 + ] + ], + "color": [ + 135, + 200, + 77 + ] + }, + { + "vertices": [ + [ + 861, + 831 + ], + [ + 878, + 333 + ], + [ + 714, + 622 + ] + ], + "color": [ + 99, + 175, + 73 + ] + }, + { + "vertices": [ + [ + 620, + 662 + ], + [ + 733, + 876 + ], + [ + 635, + 856 + ] + ], + "color": [ + 61, + 170, + 165 + ] + }, + { + "vertices": [ + [ + 703, + 162 + ], + [ + 640, + 144 + ], + [ + 885, + 136 + ] + ], + "color": [ + 65, + 193, + 142 + ] + }, + { + "vertices": [ + [ + 707, + 598 + ], + [ + 544, + 682 + ], + [ + 483, + 729 + ] + ], + "color": [ + 130, + 156, + 79 + ] + } + ], + "right_angled_indices": [ + 0, + 1 + ] + }, + "param_hash": "422b89d2ef10df78", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/prompt.txt b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/prompt.txt new file mode 100644 index 
0000000000000000000000000000000000000000..86d0acc884f63e6db42b3c518ed35bcb5a60a0f4 --- /dev/null +++ b/VBVR-Dataset/mark_right_angled_triangles_task/mark_right_angled_triangles_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows multiple triangles on a white background. Identify every triangle that has a right angle (90°) and mark each one with a red circle; each circle must enclose only that right-angled triangle, not any other shape. Show the solution step by step. \ No newline at end of file diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/final_frame.png b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4c0405a1172a6acadb434cd1fa8d02d102fbb676 Binary files /dev/null and b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/final_frame.png differ diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/first_frame.png b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a588421179388798dec556b159ce9616e764f92d Binary files /dev/null and b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/first_frame.png differ diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/ground_truth.mp4 b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c90db3b8c3b5b06f504e615a43448aaf8760eff3 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:4ec65f0c5e2c01ee8ca22c0ebba5cfb9455675b03cd4850703ecaadc1d3540f1 +size 304553 diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/metadata.json b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..246c4f580bdd1c298ceda5f77c11638420148d51 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "mark_tangent_point_after_motion_00000000", + "generator": "mark_tangent_point_after_motion", + "timestamp": "2026-02-17T06:59:05.265494", + "parameters": { + "circles": [ + { + "id": 0, + "color": "#55EFC4", + "radius": 73, + "start_position": [ + 143.738092, + 439 + ], + "final_position": [ + 512, + 439 + ] + }, + { + "id": 1, + "color": "#0984E3", + "radius": 94, + "start_position": [ + 880.261908, + 606 + ], + "final_position": [ + 512, + 606 + ] + } + ], + "tangent_point": [ + 512.0, + 512.0 + ] + }, + "param_hash": "373d891d4b962333", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/prompt.txt b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c2816419eab31e07d8ec38c8007334e53c41926 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows two circles that move only horizontally toward each other (left-to-right and right-to-left) until they touch and stop. 
First locate the single tangent point where the two circle boundaries meet, then draw a red circle around that tangent point. Show the complete marking process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/final_frame.png b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..70bdbd57de6a3ffae6eb7aa9dff2c092e37c9d99 Binary files /dev/null and b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/final_frame.png differ diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/first_frame.png b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fffbdf98707fc7a0519b1b1b1a2a9218fe1be88d Binary files /dev/null and b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/first_frame.png differ diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/ground_truth.mp4 b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..ba13c09401059f4e6a942846a7de56243c4a1974 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcade2cfa540ec43657faf87116a3f2606effabf200f26db08da27d462d0c3ae +size 297112 diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/metadata.json 
b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dd8aca585c871a1cead07286da1cc11a72b63967 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "mark_tangent_point_after_motion_00000001", + "generator": "mark_tangent_point_after_motion", + "timestamp": "2026-02-17T06:59:06.275843", + "parameters": { + "circles": [ + { + "id": 0, + "color": "#2980B9", + "radius": 81, + "start_position": [ + 108.048464, + 431 + ], + "final_position": [ + 512, + 431 + ] + }, + { + "id": 1, + "color": "#E67E22", + "radius": 79, + "start_position": [ + 915.951536, + 591 + ], + "final_position": [ + 512, + 591 + ] + } + ], + "tangent_point": [ + 512.0, + 512.0 + ] + }, + "param_hash": "fe687107f4314246", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/prompt.txt b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c2816419eab31e07d8ec38c8007334e53c41926 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows two circles that move only horizontally toward each other (left-to-right and right-to-left) until they touch and stop. First locate the single tangent point where the two circle boundaries meet, then draw a red circle around that tangent point. Show the complete marking process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/final_frame.png b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dc244e0932c1e487d231af0549f9670034444f40 Binary files /dev/null and b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/final_frame.png differ diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/first_frame.png b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e6d061cb9ff335f849d097e727fc41457dd60490 Binary files /dev/null and b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/first_frame.png differ diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/ground_truth.mp4 b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..8afc9c8e2e57cd553ee51a470fcf176c88569857 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7939564e23818faee3a8425e6a58890e73a52fe1c4c88426b83091c3d1c039a5 +size 310151 diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/metadata.json b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..32f9fc1cdf1668e511723a96637a42ee8cfc973d --- /dev/null +++ 
b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "mark_tangent_point_after_motion_00000002", + "generator": "mark_tangent_point_after_motion", + "timestamp": "2026-02-17T06:59:07.301383", + "parameters": { + "circles": [ + { + "id": 0, + "color": "#A29BFE", + "radius": 67, + "start_position": [ + 67, + 445 + ], + "final_position": [ + 512, + 445 + ] + }, + { + "id": 1, + "color": "#00B894", + "radius": 100, + "start_position": [ + 924, + 612 + ], + "final_position": [ + 512, + 612 + ] + } + ], + "tangent_point": [ + 512.0, + 512.0 + ] + }, + "param_hash": "42ebdec9a48efddb", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/prompt.txt b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8c2816419eab31e07d8ec38c8007334e53c41926 --- /dev/null +++ b/VBVR-Dataset/mark_tangent_point_after_motion_task/mark_tangent_point_after_motion_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows two circles that move only horizontally toward each other (left-to-right and right-to-left) until they touch and stop. First locate the single tangent point where the two circle boundaries meet, then draw a red circle around that tangent point. Show the complete marking process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/final_frame.png b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d3a7952c5b3ad3d04380960e0973e41e641f5faf Binary files /dev/null and b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/final_frame.png differ diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/first_frame.png b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..674f48c9f5ec50fdd962281a21006eb4a482ff53 Binary files /dev/null and b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/first_frame.png differ diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/ground_truth.mp4 b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f99e352d3f7432285b167381f3ef22edf15aa011 --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:208e55759c77482e93e1d725d93a23c75551583642e6a60cfbf0dd47fe8b5283 +size 166194 diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/metadata.json b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7d8a910e47d7ed1b0425f1106527ff3f68f38de1 --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/metadata.json @@ -0,0 +1,48 @@ +{ + "task_id": "mirror_reflection_00000000", + "generator": "mirror_reflection", + "timestamp": "2026-02-17T07:41:32.983182", + "parameters": { + "reflectivity": 0.93609, + "theta_incident_degrees": 63.391636, + "theta_reflected_degrees": 
63.391636, + "objects": [ + { + "symbol": "ray", + "start": [ + -410.256407, + 50 + ], + "end": [ + 512, + 512 + ], + "type": "incident", + "angle_degrees": 63.391636 + }, + { + "symbol": "ray", + "start": [ + 512, + 512 + ], + "end": [ + 1024, + 255.516013 + ], + "type": "reflected", + "angle_degrees": 63.391636 + } + ] + }, + "param_hash": "2ad17b000dd655dd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/prompt.txt b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..81b4ec9f8dc23b976d23ae289baeb8ff3d9da35c --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000000/prompt.txt @@ -0,0 +1 @@ +Given the mirror reflectivity = 0.94, predict the light reflection from the mirror surface. The reflected ray must extend all the way to the edge of the image. 
\ No newline at end of file diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/final_frame.png b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..78efeaea9fae8462ac5cd84c811e628511edfc3c Binary files /dev/null and b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/final_frame.png differ diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/first_frame.png b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..013a8606b04a2edaa3a7843f6fe7181a0ade0684 Binary files /dev/null and b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/first_frame.png differ diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/ground_truth.mp4 b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..87e13bd54f4ccdea013a850d21abc24516480348 --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be276ff4d3dac3c83348547b4f1513a56c83a83dd30ff434d171a8f42034e8e +size 202818 diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/metadata.json b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9383b49335a4b41a1511cf0a90e26590ac433ebc --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/metadata.json @@ -0,0 +1,48 @@ +{ + "task_id": "mirror_reflection_00000001", + "generator": "mirror_reflection", + "timestamp": "2026-02-17T07:41:33.379320", + "parameters": { + "reflectivity": 0.367415, + "theta_incident_degrees": 54.811779, + "theta_reflected_degrees": 
54.811779, + "objects": [ + { + "symbol": "ray", + "start": [ + -143.212676, + 50 + ], + "end": [ + 512, + 512 + ], + "type": "incident", + "angle_degrees": 54.811779 + }, + { + "symbol": "ray", + "start": [ + 512, + 512 + ], + "end": [ + 1024, + 150.981343 + ], + "type": "reflected", + "angle_degrees": 54.811779 + } + ] + }, + "param_hash": "5e61301310aa35f9", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/prompt.txt b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c87c5e6bb9a99611b83039766b5cf2f825cbf5c3 --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000001/prompt.txt @@ -0,0 +1 @@ +Given the mirror reflectivity = 0.37, predict the light reflection from the mirror surface. The reflected ray must extend all the way to the edge of the image. 
\ No newline at end of file diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/final_frame.png b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..46439c8b0b4e9728b7dd9119e885b286ce4bca93 Binary files /dev/null and b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/final_frame.png differ diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/first_frame.png b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..85fc7a464f65ca63df7cc6d87189f965621575eb Binary files /dev/null and b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/first_frame.png differ diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/ground_truth.mp4 b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..fb1aa5ad39acc9666a18a249cc52c0f51b4372ca --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86db8ed37596bb6a9fe8978ff77c79b368116c9a34743708f5a63f675e2c8b33 +size 195761 diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/metadata.json b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..332c6fc3b6f93f03b76d95b190e59c52d53feeee --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/metadata.json @@ -0,0 +1,48 @@ +{ + "task_id": "mirror_reflection_00000002", + "generator": "mirror_reflection", + "timestamp": "2026-02-17T07:41:33.786121", + "parameters": { + "reflectivity": 0.863874, + "theta_incident_degrees": 61.333245, + "theta_reflected_degrees": 
61.333245, + "objects": [ + { + "symbol": "ray", + "start": [ + -333.023898, + 50 + ], + "end": [ + 512, + 512 + ], + "type": "incident", + "angle_degrees": 61.333245 + }, + { + "symbol": "ray", + "start": [ + 512, + 512 + ], + "end": [ + 1024, + 232.074189 + ], + "type": "reflected", + "angle_degrees": 61.333245 + } + ] + }, + "param_hash": "4fa537bb92abd4ef", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/prompt.txt b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..dff9ee29f4f0727fdaeb1b13e7a1c3b8d78ff4ba --- /dev/null +++ b/VBVR-Dataset/mirror_reflection_task/mirror_reflection_00000002/prompt.txt @@ -0,0 +1 @@ +Given the mirror reflectivity = 0.86, predict how light reflects when it encounters the mirror. Extend the reflected ray to the image boundary. 
\ No newline at end of file diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/final_frame.png b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2708456a015d3dae91ca5e6d0ff2f7f2d3175c78 Binary files /dev/null and b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/final_frame.png differ diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/first_frame.png b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8472775712bd88c1e82965a3475bc910b8c499e9 Binary files /dev/null and b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/first_frame.png differ diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/ground_truth.mp4 b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c5984426cb9076fc6f6921bee0b4f941dd51dc1d --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d23580b720d3c64b9dcf19d3f615d1dcd3b41908ca69138e1a26e241ad212b +size 150298 diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/metadata.json b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1691a28ecfcc3b08811be828278135a90ec0ae65 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "multi_object_placement_00000000", + "generator": "multi_object_placement", + "timestamp": 
"2026-02-17T07:34:09.545922", + "parameters": { + "objects": [ + { + "id": 0, + "shape": "rectangle", + "color": "red", + "size": 91, + "position": [ + 803, + 559 + ] + }, + { + "id": 1, + "shape": "circle", + "color": "green", + "size": 56, + "position": [ + 334, + 622 + ] + }, + { + "id": 2, + "shape": "square", + "color": "purple", + "size": 56, + "position": [ + 207, + 133 + ] + } + ], + "markers": [ + { + "id": 0, + "color": "red", + "size": 28, + "position": [ + 433, + 252 + ] + }, + { + "id": 1, + "color": "green", + "size": 28, + "position": [ + 564, + 669 + ] + }, + { + "id": 2, + "color": "purple", + "size": 28, + "position": [ + 749, + 251 + ] + } + ] + }, + "param_hash": "2493334cc151a347", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/prompt.txt b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8df74f9576590ddb68e4b0582ccaf1ae568674d1 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000000/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple colored objects and star markers. Keep all star markers unchanged in position. Move each colored object to the star marker with the same color using straight paths, aligning the center of each object with the center of its matching star marker. 
\ No newline at end of file diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/final_frame.png b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4ca83bc5193e8c7d0e705324e42abb490f7a49fb Binary files /dev/null and b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/final_frame.png differ diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/first_frame.png b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..56e1d664fb566ec649c7d86ece96a65b04a647a2 Binary files /dev/null and b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/first_frame.png differ diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/ground_truth.mp4 b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..bd142f3119895b2f9a9d542eb5ef313eb1d1ae58 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d694a620cbdc73c96f5b3bf4716fc0899d23e52eccfa2d5bab9f1e0066476c +size 150414 diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/metadata.json b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..87c670ac350924174a07dfa3786705c720c73253 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "multi_object_placement_00000001", + "generator": "multi_object_placement", + "timestamp": 
"2026-02-17T07:34:10.093280", + "parameters": { + "objects": [ + { + "id": 0, + "shape": "circle", + "color": "orange", + "size": 56, + "position": [ + 151, + 908 + ] + }, + { + "id": 1, + "shape": "square", + "color": "purple", + "size": 56, + "position": [ + 461, + 550 + ] + }, + { + "id": 2, + "shape": "rectangle", + "color": "green", + "size": 91, + "position": [ + 883, + 518 + ] + } + ], + "markers": [ + { + "id": 0, + "color": "orange", + "size": 28, + "position": [ + 251, + 292 + ] + }, + { + "id": 1, + "color": "purple", + "size": 28, + "position": [ + 640, + 388 + ] + }, + { + "id": 2, + "color": "green", + "size": 28, + "position": [ + 659, + 750 + ] + } + ] + }, + "param_hash": "e7f90d5c7a73ca1d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/prompt.txt b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8df74f9576590ddb68e4b0582ccaf1ae568674d1 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000001/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple colored objects and star markers. Keep all star markers unchanged in position. Move each colored object to the star marker with the same color using straight paths, aligning the center of each object with the center of its matching star marker. 
\ No newline at end of file diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/final_frame.png b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4951540cf4047aa315023b4f14cf2ed65498d1f9 Binary files /dev/null and b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/final_frame.png differ diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/first_frame.png b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2633c42682e25dc5e1c6c4717d41a17ada41f06e Binary files /dev/null and b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/first_frame.png differ diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/ground_truth.mp4 b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c81a0ca056964195944c6705669172111590bad7 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3cff9f47eb4700da9fafe0644c4bc4a07329c5648cf26bc6522067f6e59aa1 +size 148303 diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/metadata.json b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..164ac1bbcfd0e8723aa1eb56fb0422b0ac3bb3b6 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "multi_object_placement_00000002", + "generator": "multi_object_placement", + "timestamp": 
"2026-02-17T07:34:10.637481", + "parameters": { + "objects": [ + { + "id": 0, + "shape": "triangle", + "color": "orange", + "size": 56, + "position": [ + 198, + 275 + ] + }, + { + "id": 1, + "shape": "rectangle", + "color": "red", + "size": 91, + "position": [ + 207, + 631 + ] + }, + { + "id": 2, + "shape": "square", + "color": "green", + "size": 56, + "position": [ + 916, + 874 + ] + } + ], + "markers": [ + { + "id": 0, + "color": "orange", + "size": 28, + "position": [ + 719, + 307 + ] + }, + { + "id": 1, + "color": "red", + "size": 28, + "position": [ + 646, + 630 + ] + }, + { + "id": 2, + "color": "green", + "size": 28, + "position": [ + 402, + 443 + ] + } + ] + }, + "param_hash": "52eca237dc68278a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/prompt.txt b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8df74f9576590ddb68e4b0582ccaf1ae568674d1 --- /dev/null +++ b/VBVR-Dataset/multi_object_placement_task/multi_object_placement_00000002/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple colored objects and star markers. Keep all star markers unchanged in position. Move each colored object to the star marker with the same color using straight paths, aligning the center of each object with the center of its matching star marker. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/final_frame.png b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5ec8ad11edc4ede4cb2831146a28059c5299b8ef Binary files /dev/null and b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/final_frame.png differ diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/first_frame.png b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fccfc5858a3646eab7588c39431885afec3b0ac7 Binary files /dev/null and b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/first_frame.png differ diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/ground_truth.mp4 b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f6f70c1156fc8f6b0c85a05e86b8403b60af72b6 --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854c597883667ae798a8de2b17138437618350e479547c0870e018e5b692ccd7 +size 270642 diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/metadata.json b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3d48071b3ab1c0426ce2453571afa36c6c96189d --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/metadata.json @@ -0,0 +1,112 @@ +{ + "task_id": "multiple_bounces_00000000", + "generator": "multiple_bounces", + "timestamp": "2026-02-17T07:30:50.905037", + "parameters": { + "ball": { + "x": 448, + "y": 277.855515, + "color": [ + 0, + 0, + 0 + ] + }, + "targets": [ + { + "id": 1, + "x": 576, + "y": 
403.748571, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 2, + "x": 576, + "y": 469.577143, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 3, + "x": 576, + "y": 535.405714, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 4, + "x": 576, + "y": 601.234286, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 5, + "x": 576, + "y": 667.062857, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 6, + "x": 576, + "y": 732.891429, + "color": [ + 255, + 0, + 0 + ] + } + ], + "hit_target_id": 1, + "bounce_points": [ + [ + 448.0, + 277.855515 + ], + [ + 581, + 318.29942 + ], + [ + 443, + 360.263772 + ], + [ + 581, + 402.228124 + ], + [ + 576.0, + 403.748571 + ] + ], + "wall_distance": 164 + }, + "param_hash": "bd964b74668df4fd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/prompt.txt b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6336440689aa810c48c2ab8efb688cd20082f15 --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000000/prompt.txt @@ -0,0 +1 @@ +A black ball starts with the shown initial direction arrow. It moves in straight lines and reflects off the two vertical walls following the law of reflection (the angle of reflection equals the angle of incidence). Follow this unique trajectory until the ball hits one of the red hollow circle targets in the lower-right area. Identify which target circle is hit and show the full trajectory step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/final_frame.png b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1cf00bd02ac12faee7a2cdb48dc92f87a5aec4a9 Binary files /dev/null and b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/final_frame.png differ diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/first_frame.png b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bd471ff6f177ad1a84bbf2e776f6073b1b4f0337 Binary files /dev/null and b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/first_frame.png differ diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/ground_truth.mp4 b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..552410f18c7f5a76003aac42e587d097af3c40cb --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07190a925d316857e79c739cb803111b33837293d48b708fa0cfa3502fa748bb +size 287545 diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/metadata.json b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..30e0e53c4861a1ab1729a6257c5e8e61a4c3eb9c --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/metadata.json @@ -0,0 +1,112 @@ +{ + "task_id": "multiple_bounces_00000001", + "generator": "multiple_bounces", + "timestamp": "2026-02-17T07:30:51.991775", + "parameters": { + "ball": { + "x": 341, + "y": 282.828059, + "color": [ + 0, + 0, + 0 + ] + }, + "targets": [ + { + "id": 1, + "x": 683, + "y": 
403.748571, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 2, + "x": 683, + "y": 469.577143, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 3, + "x": 683, + "y": 535.405714, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 4, + "x": 683, + "y": 601.234286, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 5, + "x": 683, + "y": 667.062857, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 6, + "x": 683, + "y": 732.891429, + "color": [ + 255, + 0, + 0 + ] + } + ], + "hit_target_id": 3, + "bounce_points": [ + [ + 341.0, + 282.828059 + ], + [ + 688, + 365.824694 + ], + [ + 336, + 450.017246 + ], + [ + 688, + 534.209797 + ], + [ + 683.0, + 535.405714 + ] + ], + "wall_distance": 378 + }, + "param_hash": "6fb5d8c9f2005782", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/prompt.txt b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6336440689aa810c48c2ab8efb688cd20082f15 --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000001/prompt.txt @@ -0,0 +1 @@ +A black ball starts with the shown initial direction arrow. It moves in straight lines and reflects off the two vertical walls following the law of reflection (the angle of reflection equals the angle of incidence). Follow this unique trajectory until the ball hits one of the red hollow circle targets in the lower-right area. Identify which target circle is hit and show the full trajectory step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/final_frame.png b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e5ddbb91c07f7008924d3a2acdad5e45c49f9a76 Binary files /dev/null and b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/final_frame.png differ diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/first_frame.png b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8de78c847ea82d322bd972a8eed0ee5d2d64a205 Binary files /dev/null and b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/first_frame.png differ diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/ground_truth.mp4 b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..460edc53c378f863407ba94296851e9b40b193dc --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875f210351f3dcfe0832bcaeae8a6a1fcdcc3c38c176c252c9fca16b0bb156c8 +size 251744 diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/metadata.json b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0a21f906a6dceab4653996f914820ff04ea3af3c --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/metadata.json @@ -0,0 +1,118 @@ +{ + "task_id": "multiple_bounces_00000002", + "generator": "multiple_bounces", + "timestamp": "2026-02-17T07:30:53.042320", + "parameters": { + "ball": { + "x": 495, + "y": 248.658497, + "color": [ + 0, + 0, + 0 + ] + }, + "targets": [ + { + "id": 1, + "x": 529, + "y": 
414.72, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 2, + "x": 529, + "y": 491.52, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 3, + "x": 529, + "y": 568.32, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 4, + "x": 529, + "y": 645.12, + "color": [ + 255, + 0, + 0 + ] + }, + { + "id": 5, + "x": 529, + "y": 721.92, + "color": [ + 255, + 0, + 0 + ] + } + ], + "hit_target_id": 1, + "bounce_points": [ + [ + 495.0, + 248.658497 + ], + [ + 534, + 269.685765 + ], + [ + 490, + 293.408837 + ], + [ + 534, + 317.131909 + ], + [ + 490, + 340.854981 + ], + [ + 534, + 364.578053 + ], + [ + 490, + 388.301124 + ], + [ + 534, + 412.024196 + ], + [ + 529.0, + 414.72 + ] + ], + "wall_distance": 70 + }, + "param_hash": "52b43c3a57f089d6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/prompt.txt b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6336440689aa810c48c2ab8efb688cd20082f15 --- /dev/null +++ b/VBVR-Dataset/multiple_bounces_task/multiple_bounces_00000002/prompt.txt @@ -0,0 +1 @@ +A black ball starts with the shown initial direction arrow. It moves in straight lines and reflects off the two vertical walls following the law of reflection (the angle of reflection equals the angle of incidence). Follow this unique trajectory until the ball hits one of the red hollow circle targets in the lower-right area. Identify which target circle is hit and show the full trajectory step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/final_frame.png b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d17afb973e01c2af405a6d1e7afcf63aa8d698b1 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/final_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/first_frame.png b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b34ee2890cc95d6f309ef9b4532a77f6d18df8f2 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/first_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/ground_truth.mp4 b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e2d1a41f5ea1787781fb6beab0054d2674da3079 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499d137b6db97c0ae84f935307b78b9f1b1edd86528d683e79619c54564ff714 +size 102201 diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/metadata.json b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5ca601abd9327f23e786c8daaaa688dc47fef952 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "multiple_occlusions_00000000", + "generator": "multiple_occlusions", + "timestamp": "2026-02-17T07:23:39.749484", + "parameters": { + "objects": [ + { + "shape": "square", + "color": 
[ + 150, + 78, + 213 + ], + "size": 127, + "id": 1, + "position": [ + 544, + 512 + ] + }, + { + "shape": "triangle", + "color": [ + 242, + 127, + 163 + ], + "size": 142, + "id": 2, + "position": [ + 690, + 512 + ] + }, + { + "shape": "circle", + "color": [ + 68, + 220, + 192 + ], + "size": 161, + "id": 3, + "position": [ + 852, + 512 + ] + } + ] + }, + "param_hash": "a97425cc50adbeb5", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/prompt.txt b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ec187f11408abe163393bd001c895a6515b260e --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 objects arranged horizontally on the right side of the frame, with a dark rectangular mask initially positioned on the left side. Move the mask horizontally to the right in a continuous motion until it leaves the frame. As it moves, the mask passes in front of the objects, temporarily blocking them from view. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/final_frame.png b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..59aa4647069c7359f52013dd7fba7ea4171e021e Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/final_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/first_frame.png b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b15d543402ad9bbe5a73332441978dc950402d08 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/first_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/ground_truth.mp4 b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..62e77700d1d5bda172b77ce5f2fa5d4dbd4937bc --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09e448c7626b4e87eadcdfb21916b31f836ab1a92188775cb991766dc70740e +size 126447 diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/metadata.json b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0ada6e8807ed0f3c107013e42d18f6bace9bdbd8 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/metadata.json @@ -0,0 +1,75 @@ +{ + "task_id": "multiple_occlusions_00000001", + "generator": "multiple_occlusions", + "timestamp": "2026-02-17T07:23:40.180661", + "parameters": { + "objects": [ + { + "shape": "triangle", + 
"color": [ + 205, + 51, + 83 + ], + "size": 121, + "id": 1, + "position": [ + 470, + 512 + ] + }, + { + "shape": "circle", + "color": [ + 159, + 217, + 88 + ], + "size": 123, + "id": 2, + "position": [ + 610, + 512 + ] + }, + { + "shape": "square", + "color": [ + 187, + 215, + 199 + ], + "size": 141, + "id": 3, + "position": [ + 752, + 512 + ] + }, + { + "shape": "pentagram", + "color": [ + 198, + 168, + 102 + ], + "size": 167, + "id": 4, + "position": [ + 912, + 512 + ] + } + ] + }, + "param_hash": "0fdbc5710d62f6b5", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/prompt.txt b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..1864e81d6227f1d3d7ca19b41cc30b80594dbec6 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 objects arranged horizontally on the right side of the frame, with a dark rectangular mask initially positioned on the left side. Move the mask horizontally to the right in a continuous motion until it leaves the frame. As it moves, the mask passes in front of the objects, temporarily blocking them from view. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/final_frame.png b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..18a104fc2402e5f6fec91687ed21f9e35d1b43e0 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/final_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/first_frame.png b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..909610f83e0aeaa1743add0e0b94708eae988885 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/first_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/ground_truth.mp4 b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..15ce5464fa1e0538f5cbce3a1ae38f230da81c9f --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7f221dbb72037c7bc30a14bd3d8372857e12f21a484e6e0a18975c43577c47 +size 103287 diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/metadata.json b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1267a9aa97317a1076b13022989d94ebdfb4c6b3 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "multiple_occlusions_00000002", + "generator": "multiple_occlusions", + "timestamp": "2026-02-17T07:23:40.601425", + "parameters": { + "objects": [ + { + "shape": "triangle", + 
"color": [ + 157, + 233, + 231 + ], + "size": 143, + "id": 1, + "position": [ + 520, + 512 + ] + }, + { + "shape": "square", + "color": [ + 170, + 208, + 117 + ], + "size": 174, + "id": 2, + "position": [ + 682, + 512 + ] + }, + { + "shape": "circle", + "color": [ + 93, + 140, + 134 + ], + "size": 178, + "id": 3, + "position": [ + 876, + 512 + ] + } + ] + }, + "param_hash": "87870265ebaccccd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/prompt.txt b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ec187f11408abe163393bd001c895a6515b260e --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_task/multiple_occlusions_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 objects arranged horizontally on the right side of the frame, with a dark rectangular mask initially positioned on the left side. Move the mask horizontally to the right in a continuous motion until it leaves the frame. As it moves, the mask passes in front of the objects, temporarily blocking them from view. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/final_frame.png b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b7b38abe50f8fec70615751193484dc3d72a2815 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/final_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/first_frame.png b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d71c098840b31050b34b089f8f287c8e2e68f94a Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/first_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/ground_truth.mp4 b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..99d80e6db707dd48c0027da4b661214b866e8809 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52443972ef41f53a5cf480c15cf4cc33c6093359686402694ac9744aedb5723 +size 178969 diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/metadata.json b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..28696f152bf5feeb4a2e5e203ac6f54da0e40b2f --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/metadata.json 
@@ -0,0 +1,49 @@ +{ + "task_id": "multiple_occlusions_vertical_00000000", + "generator": "multiple_occlusions_vertical", + "timestamp": "2026-02-17T07:12:17.468227", + "parameters": { + "objects": [ + { + "id": 1, + "type": "star", + "color": "#99353D", + "size": 100, + "position": [ + 296, + 511 + ] + }, + { + "id": 2, + "type": "circle", + "color": "#358899", + "size": 100, + "position": [ + 512, + 511 + ] + }, + { + "id": 3, + "type": "star", + "color": "#2DE554", + "size": 100, + "position": [ + 728, + 511 + ] + } + ] + }, + "param_hash": "bf83aec8e67a0d98", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/prompt.txt b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d7896389f6bd934dc8cf14b999481553c946ee0 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 objects arranged in a horizontal line in the center of the frame, with a dark rectangular mask initially positioned above them. Move the mask vertically downward in a continuous motion until it leaves the frame. As it moves, the mask passes in front of the objects, temporarily blocking them from view. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/final_frame.png b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3612c937d064c99e239b0c71c261cd34d3e34a6a Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/final_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/first_frame.png b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e3bb220c0f03714350d4130604bbf68d616b6698 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/first_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/ground_truth.mp4 b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6dbbbfe6edfa7a3b0160dd28f6e597e16cd01a97 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b432c1eb49a1b1295c0682735ef4d52707b74d80409c4aab1854b3ffb14217 +size 182889 diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/metadata.json b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a65b4f98ead79e57b4b20d3399854d2fa0710b49 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/metadata.json 
@@ -0,0 +1,59 @@ +{ + "task_id": "multiple_occlusions_vertical_00000001", + "generator": "multiple_occlusions_vertical", + "timestamp": "2026-02-17T07:12:18.191471", + "parameters": { + "objects": [ + { + "id": 1, + "type": "diamond", + "color": "#35995E", + "size": 100, + "position": [ + 296, + 511 + ] + }, + { + "id": 2, + "type": "square", + "color": "#50B9E5", + "size": 100, + "position": [ + 440, + 511 + ] + }, + { + "id": 3, + "type": "circle", + "color": "#5650E5", + "size": 100, + "position": [ + 584, + 511 + ] + }, + { + "id": 4, + "type": "hexagon", + "color": "#70991E", + "size": 100, + "position": [ + 728, + 511 + ] + } + ] + }, + "param_hash": "bd3d4ddad2829166", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/prompt.txt b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c5e77bd8b67e17ba464b8bb8a5eef9d6ef7024d --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 objects arranged in a horizontal line in the center of the frame, with a dark rectangular mask initially positioned above them. Move the mask vertically downward in a continuous motion until it leaves the frame. As it moves, the mask passes in front of the objects, temporarily blocking them from view. 
\ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/final_frame.png b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..16aa05f11857e2450f167ba0f59f9562588ffae9 Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/final_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/first_frame.png b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b3de16ca01e0a137abb40139c5dc9a702cbfde2a Binary files /dev/null and b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/first_frame.png differ diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/ground_truth.mp4 b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..265278d97977026b1414664b8f99f7dcabd4b145 --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea1eac40fb0d7076bf318423ebf0ac8177b715b39e85c6201770b4db539f217 +size 184396 diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/metadata.json b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..2ebdd60460a47a5c462619532713e3e6a3d9450e --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/metadata.json 
@@ -0,0 +1,59 @@ +{ + "task_id": "multiple_occlusions_vertical_00000002", + "generator": "multiple_occlusions_vertical", + "timestamp": "2026-02-17T07:12:18.897952", + "parameters": { + "objects": [ + { + "id": 1, + "type": "triangle", + "color": "#1E8E99", + "size": 100, + "position": [ + 296, + 511 + ] + }, + { + "id": 2, + "type": "circle", + "color": "#99471E", + "size": 100, + "position": [ + 440, + 511 + ] + }, + { + "id": 3, + "type": "circle", + "color": "#5F994C", + "size": 100, + "position": [ + 584, + 511 + ] + }, + { + "id": 4, + "type": "diamond", + "color": "#72E5BA", + "size": 100, + "position": [ + 728, + 511 + ] + } + ] + }, + "param_hash": "389e6776e23904bf", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/prompt.txt b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6c5e77bd8b67e17ba464b8bb8a5eef9d6ef7024d --- /dev/null +++ b/VBVR-Dataset/multiple_occlusions_vertical_task/multiple_occlusions_vertical_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 objects arranged in a horizontal line in the center of the frame, with a dark rectangular mask initially positioned above them. Move the mask vertically downward in a continuous motion until it leaves the frame. As it moves, the mask passes in front of the objects, temporarily blocking them from view. 
\ No newline at end of file diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000000/final_frame.png b/VBVR-Dataset/object_packing_task/object_packing_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..60438ec0c149e4c1db8e2753bf07993cd52770d0 Binary files /dev/null and b/VBVR-Dataset/object_packing_task/object_packing_00000000/final_frame.png differ diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000000/first_frame.png b/VBVR-Dataset/object_packing_task/object_packing_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e296497fde8e2f18f0414c1726f2ff73cf19f0ae Binary files /dev/null and b/VBVR-Dataset/object_packing_task/object_packing_00000000/first_frame.png differ diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000000/ground_truth.mp4 b/VBVR-Dataset/object_packing_task/object_packing_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3f8de29665972500c226db5d100fae2e2efd3f2f --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53cc8895cd8118c66dfde14f7ad2774282408fd99da5c6b47ef65c9cab3a6b25 +size 135737 diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000000/metadata.json b/VBVR-Dataset/object_packing_task/object_packing_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1afb00c9f8a61e9fceac83d7154f27738c8e27e4 --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000000/metadata.json @@ -0,0 +1,68 @@ +{ + "task_id": "object_packing_00000000", + "generator": "object_packing", + "timestamp": "2026-02-17T07:22:51.132086", + "parameters": { + "object_size": 81, + "objects": [ + { + "color": "brown", + "shape": "pentagon", + "position": [ + 102, + 409 + ], + "final_position": [ + 614, + 410 + ] + }, + { + "color": 
"green", + "shape": "diamond", + "position": [ + 224, + 409 + ], + "final_position": [ + 716, + 410 + ] + }, + { + "color": "red", + "shape": "triangle", + "position": [ + 163, + 614 + ], + "final_position": [ + 614, + 512 + ] + } + ], + "container": { + "position": [ + 716, + 512 + ], + "size": 307 + }, + "color_order": [ + "brown", + "red", + "green" + ] + }, + "param_hash": "1cc3ca31325bf2af", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000000/prompt.txt b/VBVR-Dataset/object_packing_task/object_packing_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..156ec57bdad881bedbb7f0f737a65ce1b6ee49b2 --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows objects on the left side and a container on the right side. Place the objects into the container one by one in the color order: brown - red - green. Each object must be placed individually in the exact order specified, and all objects must end up inside the container. 
\ No newline at end of file diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000001/final_frame.png b/VBVR-Dataset/object_packing_task/object_packing_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f56444592c9b65f8833c277a749daccbaa25e334 Binary files /dev/null and b/VBVR-Dataset/object_packing_task/object_packing_00000001/final_frame.png differ diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000001/first_frame.png b/VBVR-Dataset/object_packing_task/object_packing_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3db57bd4eed60218947e8cf5c99608e8426bb719 Binary files /dev/null and b/VBVR-Dataset/object_packing_task/object_packing_00000001/first_frame.png differ diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000001/ground_truth.mp4 b/VBVR-Dataset/object_packing_task/object_packing_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..db6868405c9eca338b6c52eec36380624d0622f4 --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab1359dc3e6f9fb94b1dcca6a9a26167b48093822221c97e36492e2b69dc243 +size 137350 diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000001/metadata.json b/VBVR-Dataset/object_packing_task/object_packing_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..32dca2cfdc136269baee6ece077b00d3e2d0ecce --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000001/metadata.json @@ -0,0 +1,68 @@ +{ + "task_id": "object_packing_00000001", + "generator": "object_packing", + "timestamp": "2026-02-17T07:22:51.461196", + "parameters": { + "object_size": 81, + "objects": [ + { + "color": "pink", + "shape": "circle", + "position": [ + 102, + 409 + ], + "final_position": [ + 614, + 410 + ] + }, + { + "color": 
"green", + "shape": "diamond", + "position": [ + 224, + 409 + ], + "final_position": [ + 716, + 410 + ] + }, + { + "color": "orange", + "shape": "pentagon", + "position": [ + 163, + 614 + ], + "final_position": [ + 614, + 512 + ] + } + ], + "container": { + "position": [ + 716, + 512 + ], + "size": 307 + }, + "color_order": [ + "green", + "pink", + "orange" + ] + }, + "param_hash": "ff6b430ecd4cfabe", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000001/prompt.txt b/VBVR-Dataset/object_packing_task/object_packing_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..b112dc873c5fd7f5e932a1207e7a353a754b009c --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows objects on the left side and a container on the right side. Place the objects into the container one by one in the color order: green - pink - orange. Each object must be placed individually in the exact order specified, and all objects must end up inside the container. 
\ No newline at end of file diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000002/final_frame.png b/VBVR-Dataset/object_packing_task/object_packing_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..209f9aa7c228aa6dcecc80fbc962dbf4db4990c1 Binary files /dev/null and b/VBVR-Dataset/object_packing_task/object_packing_00000002/final_frame.png differ diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000002/first_frame.png b/VBVR-Dataset/object_packing_task/object_packing_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0ce88f5bac596be10219b5efce21ac64c88ea327 Binary files /dev/null and b/VBVR-Dataset/object_packing_task/object_packing_00000002/first_frame.png differ diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000002/ground_truth.mp4 b/VBVR-Dataset/object_packing_task/object_packing_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0dcc77ef39170078c817d4f524e58d18626883e1 --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3a282283ed6b7acfe49aaaaa393c468ded4d51f80e93bdeaf6a6f472c9dfc5 +size 135283 diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000002/metadata.json b/VBVR-Dataset/object_packing_task/object_packing_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4168cba861f4a436f625aa8abe46520e44b21e --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000002/metadata.json @@ -0,0 +1,81 @@ +{ + "task_id": "object_packing_00000002", + "generator": "object_packing", + "timestamp": "2026-02-17T07:22:51.809745", + "parameters": { + "object_size": 81, + "objects": [ + { + "color": "red", + "shape": "star", + "position": [ + 102, + 409 + ], + "final_position": [ + 614, + 410 + ] + }, + { + "color": "blue", + 
"shape": "pentagon", + "position": [ + 224, + 409 + ], + "final_position": [ + 716, + 410 + ] + }, + { + "color": "brown", + "shape": "square", + "position": [ + 102, + 614 + ], + "final_position": [ + 614, + 512 + ] + }, + { + "color": "pink", + "shape": "circle", + "position": [ + 224, + 614 + ], + "final_position": [ + 716, + 512 + ] + } + ], + "container": { + "position": [ + 716, + 512 + ], + "size": 307 + }, + "color_order": [ + "red", + "pink", + "brown", + "blue" + ] + }, + "param_hash": "abcef60691b921ec", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/object_packing_task/object_packing_00000002/prompt.txt b/VBVR-Dataset/object_packing_task/object_packing_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e666de1ac78818ddf2b5bedb892ed9e7b34e77b1 --- /dev/null +++ b/VBVR-Dataset/object_packing_task/object_packing_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows objects on the left side and a container on the right side. Place the objects into the container one by one in the color order: red - pink - brown - blue. Each object must be placed individually in the exact order specified, and all objects must end up inside the container. 
\ No newline at end of file diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/final_frame.png b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3e9b7db8e4a9d99864d34a31c5a4579cd19ad848 Binary files /dev/null and b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/final_frame.png differ diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/first_frame.png b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..208500ffeee4704cde72853aeca00dc32d2aedc9 Binary files /dev/null and b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/first_frame.png differ diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/ground_truth.mp4 b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..fa94e42dfea599999a6822c836fef024a9581430 --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b65e5e792a5a5b69965b195f24924137d78fe7af0035cdc0600367538eb053 +size 204735 diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/metadata.json b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fcca7b2888cc606d46635f449fb53175e92d87ce --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/metadata.json @@ -0,0 +1,27 @@ +{ + "task_id": "object_trajectory_00000000", + "generator": "object_trajectory", + "timestamp": "2026-02-17T07:07:55.923428", + "parameters": { + "start_pos": [ + 288, + 877 + ], + "end_pos": [ + 835, + 629 + ], + "ball_color": "#4a44c0", + 
"shape": "triangle" + }, + "param_hash": "1f53619bedd21a1f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/prompt.txt b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f3b9bc54dace2b7951b47c7fc416cafd1e629ba --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000000/prompt.txt @@ -0,0 +1 @@ +The scene contains a triangle object and a dashed target position (indicated by a dashed outline of the same shape). Keep the dashed target position unchanged. Move the triangle object to the dashed target position along the shortest path, ensuring it completely overlaps with the target. \ No newline at end of file diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/final_frame.png b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a0cff8402b01dcd191e797b0c6c7e8cece50542a Binary files /dev/null and b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/final_frame.png differ diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/first_frame.png b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..046f2d57feded70beaab3787927ef21fd3440260 Binary files /dev/null and b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/first_frame.png differ diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/ground_truth.mp4 b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b12eb9e30865946c2f8652d28b132b486100042e 
--- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4553f6e52d108441cbd61adaa7d70c2d9b9bfd6801f7d48d301edb4cae9d97af +size 174706 diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/metadata.json b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa0f385099532d862f5359ca9095dd99cf7b446 --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/metadata.json @@ -0,0 +1,27 @@ +{ + "task_id": "object_trajectory_00000001", + "generator": "object_trajectory", + "timestamp": "2026-02-17T07:07:56.605589", + "parameters": { + "start_pos": [ + 928, + 917 + ], + "end_pos": [ + 722, + 592 + ], + "ball_color": "#558277", + "shape": "circle" + }, + "param_hash": "6b58abb06a3e0d27", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/prompt.txt b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2c9d8456668022597f20cd36517cb9ae486ca391 --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000001/prompt.txt @@ -0,0 +1 @@ +The scene contains a circle object and a dashed target position (indicated by a dashed outline of the same shape). Keep the dashed target position unchanged. Move the circle object to the dashed target position along the shortest path, ensuring it completely overlaps with the target. 
\ No newline at end of file diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/final_frame.png b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1b18a99d1417e75268bee637d502d7bbabfd620a Binary files /dev/null and b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/final_frame.png differ diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/first_frame.png b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7679f054e5a808dc84157466316255b9dc2fb6de Binary files /dev/null and b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/first_frame.png differ diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/ground_truth.mp4 b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..158cd80bf92417d73a425c020e674b179b0fb54e --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c0f855db00692889c9ddb557dc5bc9b8d9fdc5265300df530ed1927d4eb55e +size 189778 diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/metadata.json b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..cd000568062d572c638329feb2c30063ee4f4f31 --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/metadata.json @@ -0,0 +1,27 @@ +{ + "task_id": "object_trajectory_00000002", + "generator": "object_trajectory", + "timestamp": "2026-02-17T07:07:57.211760", + "parameters": { + "start_pos": [ + 105, + 187 + ], + "end_pos": [ + 517, + 748 + ], + "ball_color": "#583e70", + 
"shape": "triangle" + }, + "param_hash": "4de99e059b016725", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/prompt.txt b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2f3b9bc54dace2b7951b47c7fc416cafd1e629ba --- /dev/null +++ b/VBVR-Dataset/object_trajectory_task/object_trajectory_00000002/prompt.txt @@ -0,0 +1 @@ +The scene contains a triangle object and a dashed target position (indicated by a dashed outline of the same shape). Keep the dashed target position unchanged. Move the triangle object to the dashed target position along the shortest path, ensuring it completely overlaps with the target. \ No newline at end of file diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/final_frame.png b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..256f4af548e2df273351a093388914bfde6d143c Binary files /dev/null and b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/final_frame.png differ diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/first_frame.png b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..aceeda586be78247ccf8f711f9647259cab42d8c Binary files /dev/null and b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/first_frame.png differ diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/ground_truth.mp4 b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..ab97a89b3dd9b8f4ed5b8eeed901dd8e54db9ddf --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be3cfcbddecdaa20b7adcd0005bdce53d4a982036a1760b235a50880d8e4f62 +size 240463 diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/metadata.json b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7ed0b15b57e360e7401e494f4dc354b1eb3d71f7 --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/metadata.json @@ -0,0 +1,60 @@ +{ + "task_id": "predict_next_color_00000000", + "generator": "predict_next_color", + "timestamp": "2026-02-19T02:32:58.463033", + "parameters": { + "sequence": [ + { + "color": [ + 245, + 74, + 245 + ], + "shape": "circle" + }, + { + "color": [ + 245, + 74, + 245 + ], + "shape": "circle" + }, + { + "color": [ + 137, + 215, + 102 + ], + "shape": "circle" + }, + { + "color": [ + 137, + 215, + 102 + ], + "shape": "circle" + } + ], + "answer": { + "color": [ + 245, + 74, + 245 + ], + "shape": "circle" + }, + "pattern_type": "double_alternating" + }, + "param_hash": "9bd3b7b07db18513", + "generation": { + "seed": 901656320, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/prompt.txt b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4443d74b53942d6092665e4d7337ca5f657a0f6 --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000000/prompt.txt @@ -0,0 +1 @@ +Predict the next color in the sequence. 
\ No newline at end of file diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/final_frame.png b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f4d7d0d550473892d54f10d2ab941f744b5c51d6 Binary files /dev/null and b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/final_frame.png differ diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/first_frame.png b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..82a6060630bb56aaa1cb7254827e9a17287d7786 Binary files /dev/null and b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/first_frame.png differ diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/ground_truth.mp4 b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e57eefcac22874c5df47b249e6d7dd94af0043ab --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b29519aaaff7285e058c723182b1cbdbef6d8169239eace32f57e51a2218f055 +size 213631 diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/metadata.json b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5ba310d1223c62e289134af0a873215610b78a9f --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/metadata.json @@ -0,0 +1,60 @@ +{ + "task_id": "predict_next_color_00000001", + "generator": "predict_next_color", + "timestamp": "2026-02-19T02:32:58.950400", + "parameters": { + "sequence": [ + { + "color": [ + 102, + 252, + 190 + ], + "shape": 
"pentagon" + }, + { + "color": [ + 168, + 50, + 229 + ], + "shape": "pentagon" + }, + { + "color": [ + 102, + 252, + 190 + ], + "shape": "pentagon" + }, + { + "color": [ + 168, + 50, + 229 + ], + "shape": "pentagon" + } + ], + "answer": { + "color": [ + 102, + 252, + 190 + ], + "shape": "pentagon" + }, + "pattern_type": "alternating" + }, + "param_hash": "1cdb71203344ab26", + "generation": { + "seed": 901656320, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/prompt.txt b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4443d74b53942d6092665e4d7337ca5f657a0f6 --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000001/prompt.txt @@ -0,0 +1 @@ +Predict the next color in the sequence. \ No newline at end of file diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/final_frame.png b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f7d50a3bbf1b45f234934410021baf3e8039a711 Binary files /dev/null and b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/final_frame.png differ diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/first_frame.png b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b6a88b668d2189f6e2cac554767e859290a3c4cf Binary files /dev/null and b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/first_frame.png differ diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/ground_truth.mp4 b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/ground_truth.mp4 new file mode 100644 
index 0000000000000000000000000000000000000000..8bffa0d114547ccb815a5784c22f3e4625451175 --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5824800f0a93ff8f0233768289f2b54d866cfba485c039754d5d8f5fa429a6ae +size 179691 diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/metadata.json b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..df6b2d57a289e7ead3471bea620c559a38096aa1 --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/metadata.json @@ -0,0 +1,25 @@ +{ + "task_id": "predict_next_color_00000002", + "generator": "predict_next_color", + "timestamp": "2026-02-17T07:33:05.312728", + "parameters": { + "sequence": [ + "lavender", + "indigo", + "emerald", + "lavender" + ], + "answer": "indigo", + "pattern_type": "triple_pattern" + }, + "param_hash": "f3f38fb7ac3d9639", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/prompt.txt b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e4443d74b53942d6092665e4d7337ca5f657a0f6 --- /dev/null +++ b/VBVR-Dataset/predict_next_color_task/predict_next_color_00000002/prompt.txt @@ -0,0 +1 @@ +Predict the next color in the sequence. 
\ No newline at end of file diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/._ground_truth.mp4 b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/._ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d083447fe8eebb9b1d6d000fd437864bd0a5d0ce Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/._ground_truth.mp4 differ diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/final_frame.png b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..789bf3226d6a6de8588f61a89f046139997c2863 Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/final_frame.png differ diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/first_frame.png b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..186c2714db70603d30923bb3eabc3f5518074c20 Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/first_frame.png differ diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/ground_truth.mp4 b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..254aa1e868d18b3835894a0e1aff5e0d9081d5cf --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1af154306a730cb7e87927687c50f7ff41802401fbe2ecfa3dbb61a7291e4a1 +size 400748 diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/metadata.json b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f32cf131c931c21818f76ff04b9463098a848694 --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "read_the_chart_data_semantic_comprehension_00000000", + "generator": "read_the_chart_data_semantic_comprehension", + "timestamp": "2026-02-26T09:52:48.710371", + "parameters": { + "row_category": "Quarter", + "row_items": [ + "Q1", + "Q3", + "Q2", + "Q4", + "Total" + ], + "col_category": "Phone", + "col_items": [ + "Mi 14", + "Mate 60", + "Galaxy S24" + ], + "data": { + "Q1": { + "Mi 14": 221, + "Mate 60": 76, + "Galaxy S24": 79 + }, + "Q3": { + "Mi 14": 276, + "Mate 60": 91, + "Galaxy S24": 180 + }, + "Q2": { + "Mi 14": 159, + "Mate 60": 22, + "Galaxy S24": 86 + }, + "Q4": { + "Mi 14": 32, + "Mate 60": 73, + "Galaxy S24": 238 + }, + "Total": { + "Mi 14": 688, + "Mate 60": 262, + "Galaxy S24": 583 + } + }, + "target_row": "Q3", + "target_col": "Mi 14", + "target_value": 276, + "search_direction": "row", + "search_type": "max", + "search_item": "Q3", + "data_type": "sales" + }, + "param_hash": "00506ffa24fe0fa7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ 
No newline at end of file diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/prompt.txt b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0b510fda7f2f026f6b3eaeace8f89d53b8db14be --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a sales table with Quarter as rows and Phone as columns. Find the maximum value within the row corresponding to the Quarter 'Q3' and draw a red rectangular border around the corresponding cell to highlight it. \ No newline at end of file diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/final_frame.png b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7bd3e5871194ec73189870545087bf8b71e81d57 Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/final_frame.png differ diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/first_frame.png b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..944858b58fe69705d99c0f02baef31bd2bff6090 Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/first_frame.png differ diff --git 
a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/ground_truth.mp4 b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2ba5f9355f953c020fe1ea91726f9e962d1061e9 --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9030e01816cdca6f2a3aea66f0abb661abadacd75eaf2958a8ed4cca0ab5566c +size 437736 diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/metadata.json b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..31d02e5e090a4b8a09c627c4e6211fe872a1bc5e --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "read_the_chart_data_semantic_comprehension_00000001", + "generator": "read_the_chart_data_semantic_comprehension", + "timestamp": "2026-02-26T09:52:49.301953", + "parameters": { + "row_category": "Dept", + "row_items": [ + "Logistics", + "Support", + "Marketing", + "Sales", + "Total" + ], + "col_category": "Color", + "col_items": [ + "Yellow", + "Red", + "Black", + "White" + ], + "data": { + "Logistics": { + "Yellow": 130, + "Red": 168, + "Black": 77, + "White": 183 + }, + "Support": { + "Yellow": 15, + "Red": 53, + "Black": 100, + "White": 94 + }, + "Marketing": { + "Yellow": 144, + "Red": 103, + "Black": 117, + "White": 193 + }, + "Sales": { + "Yellow": 191, + "Red": 105, + "Black": 185, + "White": 122 + }, + "Total": { + "Yellow": 480, + "Red": 429, + 
"Black": 479, + "White": 592 + } + }, + "target_row": "Logistics", + "target_col": "Black", + "target_value": 77, + "search_direction": "column", + "search_type": "min", + "search_item": "Black", + "data_type": "inventory" + }, + "param_hash": "91a939171fd3c49f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/prompt.txt b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..b40cac439c2681a4228f7cea2b5d104d0ca0fa35 --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a inventory table with Dept as rows and Color as columns. Find the minimum value within the column corresponding to the Color 'Black' and draw a red rectangular border around the corresponding cell to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/final_frame.png b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..13afac5b3313b2c4a31198d69a2a6646decca5d6 Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/final_frame.png differ diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/first_frame.png b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6d1547318f80338f552d2b4beda92642031d23ed Binary files /dev/null and b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/first_frame.png differ diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/ground_truth.mp4 b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2f81b093391ae6b7c72a8a5569d09e01c72847b1 --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eac14297c0bec4e9675a78b62d31ac7138ad42b8425503ae005347c2b8d597f0 +size 388442 diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/metadata.json 
b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..18229c20b295df705ecc58089d236731fa69a727 --- /dev/null +++ b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "read_the_chart_data_semantic_comprehension_00000002", + "generator": "read_the_chart_data_semantic_comprehension", + "timestamp": "2026-02-26T09:52:49.871916", + "parameters": { + "row_category": "Dept", + "row_items": [ + "Sales", + "Logistics", + "Support", + "Marketing", + "Total" + ], + "col_category": "Color", + "col_items": [ + "White", + "Red", + "Blue" + ], + "data": { + "Sales": { + "White": 97, + "Red": 65, + "Blue": 108 + }, + "Logistics": { + "White": 135, + "Red": 11, + "Blue": 153 + }, + "Support": { + "White": 21, + "Red": 189, + "Blue": 96 + }, + "Marketing": { + "White": 169, + "Red": 164, + "Blue": 81 + }, + "Total": { + "White": 422, + "Red": 429, + "Blue": 438 + } + }, + "target_row": "Logistics", + "target_col": "Red", + "target_value": 11, + "search_direction": "column", + "search_type": "min", + "search_item": "Red", + "data_type": "inventory" + }, + "param_hash": "837b1c2dd0b7de68", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/prompt.txt b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..3720b7578821903c190fe5d7dff3aee36f3ed648 --- /dev/null +++ 
b/VBVR-Dataset/read_the_chart_data_semantic_comprehension_task/read_the_chart_data_semantic_comprehension_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a inventory table with Dept as rows and Color as columns. Find the minimum value within the column corresponding to the Color 'Red' and draw a red rectangular border around the corresponding cell to highlight it. \ No newline at end of file diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/final_frame.png b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c48b9cd3a2f80607749b0f28b1c61fd7913837da Binary files /dev/null and b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/final_frame.png differ diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/first_frame.png b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0384f896d03c2b3b7bc82491bfaa47fe87ecae80 Binary files /dev/null and b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/first_frame.png differ diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/ground_truth.mp4 b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e4494d9e3b5b4645baeae6f5f81c3221fd06b6c5 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f06a36fdf1905a41338a9551da9ed1067e250d35e4267c1a00f5363ac48cc6 +size 122548 diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/metadata.json b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd8276acf78bd0d881ffdcb0268d54f2e1dc077 --- /dev/null +++ 
b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/metadata.json @@ -0,0 +1,76 @@ +{ + "task_id": "reorder_objects_00000000", + "generator": "reorder_objects", + "timestamp": "2026-02-17T07:20:23.095378", + "parameters": { + "num_objects": 4, + "objects": [ + { + "shape": "cylinder", + "color": [ + 234, + 84, + 85 + ], + "pos": [ + 253, + 512 + ], + "size": 68 + }, + { + "shape": "circle", + "color": [ + 230, + 126, + 34 + ], + "pos": [ + 425, + 512 + ], + "size": 68 + }, + { + "shape": "cylinder", + "color": [ + 230, + 126, + 34 + ], + "pos": [ + 597, + 512 + ], + "size": 68 + }, + { + "shape": "triangle", + "color": [ + 46, + 204, + 113 + ], + "pos": [ + 769, + 512 + ], + "size": 68 + } + ], + "swap_indices": [ + 3, + 1 + ] + }, + "param_hash": "795864aba887343a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/prompt.txt b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..86e17d9656e87c4872435171ffdd5ae5b94ef416 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000000/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple objects arranged in a horizontal line. Keep all other objects unchanged. Swap the positions of the 4th and 2nd objects from the left using shortest paths. 
\ No newline at end of file diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/final_frame.png b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c21c1e41bce17ab515593daee827188e3e5ed0c9 Binary files /dev/null and b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/final_frame.png differ diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/first_frame.png b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..77509d0270f786f91ec69458877e1c20e0083a13 Binary files /dev/null and b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/first_frame.png differ diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/ground_truth.mp4 b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..35ab60027886da9f85ec76553b693d33c2dd98a6 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f9dd4e586957e11c52d6d0be172a05adbad8af99211840463dee480568a24c +size 107020 diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/metadata.json b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8570211783efa064266c0adc23b9245de13e7341 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/metadata.json @@ -0,0 +1,102 @@ +{ + "task_id": "reorder_objects_00000001", + "generator": "reorder_objects", + "timestamp": "2026-02-17T07:20:23.444689", + "parameters": { + "num_objects": 6, + "objects": [ + { + "shape": "circle", + "color": [ + 230, + 126, + 34 + ], + "pos": [ + 204, + 512 + ], + "size": 49 + }, + { + 
"shape": "circle", + "color": [ + 241, + 196, + 15 + ], + "pos": [ + 327, + 512 + ], + "size": 49 + }, + { + "shape": "cylinder", + "color": [ + 241, + 196, + 15 + ], + "pos": [ + 450, + 512 + ], + "size": 49 + }, + { + "shape": "square", + "color": [ + 46, + 204, + 113 + ], + "pos": [ + 573, + 512 + ], + "size": 49 + }, + { + "shape": "triangle", + "color": [ + 241, + 196, + 15 + ], + "pos": [ + 696, + 512 + ], + "size": 49 + }, + { + "shape": "circle", + "color": [ + 52, + 152, + 219 + ], + "pos": [ + 819, + 512 + ], + "size": 49 + } + ], + "swap_indices": [ + 0, + 1 + ] + }, + "param_hash": "0070c7a08c047d4e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/prompt.txt b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f34c5e2f68e87a6f96b6701258657b7377439e2 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000001/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple objects arranged in a horizontal line. Keep all other objects unchanged. Swap the positions of the 1st and 2nd objects from the left using shortest paths. 
\ No newline at end of file diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/final_frame.png b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..97e4b19092d36aa40ee57787c19e4b99987e5f2d Binary files /dev/null and b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/final_frame.png differ diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/first_frame.png b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f772b2b483e32d66e7b1f0c37e5a730cc8c1a103 Binary files /dev/null and b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/first_frame.png differ diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/ground_truth.mp4 b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..252669d66bfbd21bf0ffd63a0dd617f2fef1dad1 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd718fac39cbbde0753fadb3267d4b1d092ecdb447115ac7a05af6b71b15b93b +size 140456 diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/metadata.json b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5a91cfee3cfad07515933677a1d2820f6241f879 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/metadata.json @@ -0,0 +1,76 @@ +{ + "task_id": "reorder_objects_00000002", + "generator": "reorder_objects", + "timestamp": "2026-02-17T07:20:23.791500", + "parameters": { + "num_objects": 4, + "objects": [ + { + "shape": "circle", + "color": [ + 52, + 152, + 219 + ], + "pos": [ + 253, + 512 + ], + "size": 68 + }, + { + 
"shape": "cylinder", + "color": [ + 230, + 126, + 34 + ], + "pos": [ + 425, + 512 + ], + "size": 68 + }, + { + "shape": "cylinder", + "color": [ + 46, + 204, + 113 + ], + "pos": [ + 597, + 512 + ], + "size": 68 + }, + { + "shape": "hexagon", + "color": [ + 241, + 196, + 15 + ], + "pos": [ + 769, + 512 + ], + "size": 68 + } + ], + "swap_indices": [ + 3, + 0 + ] + }, + "param_hash": "2279faf9b3f270bc", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/prompt.txt b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d99dcc932004349b01c719b8c441eaa64d6ed28 --- /dev/null +++ b/VBVR-Dataset/reorder_objects_task/reorder_objects_00000002/prompt.txt @@ -0,0 +1 @@ +The scene contains multiple objects arranged in a horizontal line. Keep all other objects unchanged. Swap the positions of the 4th and 1st objects from the left using shortest paths. 
\ No newline at end of file diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000000/final_frame.png b/VBVR-Dataset/resize_object_task/resize_object_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5b6937f279348e23e8beb640c01b633f6e5edceb Binary files /dev/null and b/VBVR-Dataset/resize_object_task/resize_object_00000000/final_frame.png differ diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000000/first_frame.png b/VBVR-Dataset/resize_object_task/resize_object_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6bf8b1e0e71d74b0b32b1191fee98a07df21a260 Binary files /dev/null and b/VBVR-Dataset/resize_object_task/resize_object_00000000/first_frame.png differ diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000000/ground_truth.mp4 b/VBVR-Dataset/resize_object_task/resize_object_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..10d4fc4dd8b094183e4d3471f715c62eb92b2cf0 --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c12ce76cc1b8289dc896eee1b670c9e07b18f2091f01b68cb1c989e0b44251a +size 134325 diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000000/metadata.json b/VBVR-Dataset/resize_object_task/resize_object_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7ffa76c4e563a7d4ec899428e56047f84809753a --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000000/metadata.json @@ -0,0 +1,27 @@ +{ + "task_id": "resize_object_00000000", + "generator": "resize_object", + "timestamp": "2026-02-17T07:34:18.292769", + "parameters": { + "layout": "horizontal", + "shape": "star", + "color": [ + 76, + 114, + 153 + ], + "source_size": 81, + "target_size": 124, + "reference_side": "left" + }, + "param_hash": "4b7721e7a0de264d", + 
"generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000000/prompt.txt b/VBVR-Dataset/resize_object_task/resize_object_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..167308a3f61f6ae1032ff9404cea9f768523af3f --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000000/prompt.txt @@ -0,0 +1 @@ +Resize the right object so its size matches the left reference object. Only change size. \ No newline at end of file diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000001/final_frame.png b/VBVR-Dataset/resize_object_task/resize_object_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3b9a71b01fe9dc5f5bb22248efebdedf58c3c376 Binary files /dev/null and b/VBVR-Dataset/resize_object_task/resize_object_00000001/final_frame.png differ diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000001/first_frame.png b/VBVR-Dataset/resize_object_task/resize_object_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1d3f35c31917ef828963fe7807c115732bf50b2e Binary files /dev/null and b/VBVR-Dataset/resize_object_task/resize_object_00000001/first_frame.png differ diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000001/ground_truth.mp4 b/VBVR-Dataset/resize_object_task/resize_object_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4452e7c395d2921a9957c74688a226da373afec5 --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3cd34f61a99f302b8fcc12bc41e0895e6baa35bbc5852091d7be71cfc0eeb5 +size 110511 diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000001/metadata.json 
b/VBVR-Dataset/resize_object_task/resize_object_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d6114ef114f2405cf4f2eb3b686249240d89fd92 --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000001/metadata.json @@ -0,0 +1,27 @@ +{ + "task_id": "resize_object_00000001", + "generator": "resize_object", + "timestamp": "2026-02-17T07:34:18.661973", + "parameters": { + "layout": "vertical", + "shape": "octagon", + "color": [ + 215, + 229, + 114 + ], + "source_size": 53, + "target_size": 89, + "reference_side": "top" + }, + "param_hash": "2751931ccba8c469", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000001/prompt.txt b/VBVR-Dataset/resize_object_task/resize_object_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d04e6631bfd018339c264a333f5c13e39f7bfd07 --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000001/prompt.txt @@ -0,0 +1 @@ +Resize the bottom object so its size matches the top reference object. Only change size. 
\ No newline at end of file diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000002/final_frame.png b/VBVR-Dataset/resize_object_task/resize_object_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..61fddf74b67e079770513590c1db502e23ffdc7e Binary files /dev/null and b/VBVR-Dataset/resize_object_task/resize_object_00000002/final_frame.png differ diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000002/first_frame.png b/VBVR-Dataset/resize_object_task/resize_object_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b792212a0ef2bf57833cef0fdde751d9529fbf2b Binary files /dev/null and b/VBVR-Dataset/resize_object_task/resize_object_00000002/first_frame.png differ diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000002/ground_truth.mp4 b/VBVR-Dataset/resize_object_task/resize_object_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..8bcd00ef9c10835d4dc64e093e5a6d26f3af197c --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35742bf812e8ab61de524dcda48cb159df2b1b460e2260ac9dff0164f5873d26 +size 104781 diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000002/metadata.json b/VBVR-Dataset/resize_object_task/resize_object_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..10a97e06c65d6eca11ecb92fe9b05381cb360bf4 --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000002/metadata.json @@ -0,0 +1,27 @@ +{ + "task_id": "resize_object_00000002", + "generator": "resize_object", + "timestamp": "2026-02-17T07:34:19.026424", + "parameters": { + "layout": "horizontal", + "shape": "cross", + "color": [ + 30, + 112, + 153 + ], + "source_size": 116, + "target_size": 79, + "reference_side": "left" + }, + "param_hash": "5b12536dcdc71d39", + 
"generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/resize_object_task/resize_object_00000002/prompt.txt b/VBVR-Dataset/resize_object_task/resize_object_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..167308a3f61f6ae1032ff9404cea9f768523af3f --- /dev/null +++ b/VBVR-Dataset/resize_object_task/resize_object_00000002/prompt.txt @@ -0,0 +1 @@ +Resize the right object so its size matches the left reference object. Only change size. \ No newline at end of file diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/final_frame.png b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ac50c36e3295d0157e96937b4fcf38552fdf1a7e Binary files /dev/null and b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/final_frame.png differ diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/first_frame.png b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c541ca1267003457c63bfab766d6a3c8b24c5b86 Binary files /dev/null and b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/first_frame.png differ diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/ground_truth.mp4 b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d95af1f2ac73a0f48dc1f3e680209082880db6b5 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:bbf57cf4e103b0c3a94994e45a7facf0dcbb8218cedc369634231055d4a5dbb7 +size 103675 diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/metadata.json b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..eeb812e088ae6dfcb50b6d8b71b5c275503ddb4e --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/metadata.json @@ -0,0 +1,69 @@ +{ + "task_id": "return_to_correct_bin_00000000", + "generator": "return_to_correct_bin", + "timestamp": "2026-02-17T07:34:50.740296", + "parameters": { + "bins": [ + { + "id": 0, + "color": [ + 49, + 37, + 168 + ], + "x": 341, + "y": 204 + }, + { + "id": 1, + "color": [ + 155, + 227, + 181 + ], + "x": 682, + "y": 204 + } + ], + "items": [ + { + "color": [ + 49, + 37, + 168 + ], + "shape": "square", + "bin_index": 0, + "size": 60, + "initial_x": 179, + "initial_y": 883, + "final_x": 301, + "final_y": 206 + }, + { + "color": [ + 155, + 227, + 181 + ], + "shape": "triangle", + "bin_index": 1, + "size": 60, + "initial_x": 688, + "initial_y": 513, + "final_x": 636, + "final_y": 209 + } + ] + }, + "param_hash": "72ef4afc7a66fd3c", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/prompt.txt b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bca1f25eba773b54a4e1f5381e252ff7bf1f527 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000000/prompt.txt @@ -0,0 +1 @@ +Move each item into the bin that matches its color. Only move items, do not change anything else. 
\ No newline at end of file diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/final_frame.png b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f13aa0dbb4bdecfb4cbbea05a30e21a23c18056c Binary files /dev/null and b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/final_frame.png differ diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/first_frame.png b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..297a1a1d69b9d526815c2bf8c45f2df4c6d2ab0c Binary files /dev/null and b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/first_frame.png differ diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/ground_truth.mp4 b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..60b8ad113a16ebf5e4de6ace670683d751153830 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eaf2f7e924beb1197b1f853d20a31b77f2b98f6536cbd51d386e2856d711eee +size 268628 diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/metadata.json b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d5a3676cb92f341ba1373c3c05e14930fcea0a78 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/metadata.json @@ -0,0 +1,121 @@ +{ + "task_id": "return_to_correct_bin_00000001", + "generator": "return_to_correct_bin", + "timestamp": "2026-02-17T07:34:51.347246", + "parameters": 
{ + "bins": [ + { + "id": 0, + "color": [ + 2, + 66, + 12 + ], + "x": 256, + "y": 204 + }, + { + "id": 1, + "color": [ + 53, + 218, + 76 + ], + "x": 512, + "y": 204 + }, + { + "id": 2, + "color": [ + 24, + 124, + 171 + ], + "x": 768, + "y": 204 + } + ], + "items": [ + { + "color": [ + 2, + 66, + 12 + ], + "shape": "triangle", + "bin_index": 0, + "size": 60, + "initial_x": 208, + "initial_y": 851, + "final_x": 211, + "final_y": 216 + }, + { + "color": [ + 2, + 66, + 12 + ], + "shape": "square", + "bin_index": 0, + "size": 60, + "initial_x": 692, + "initial_y": 641, + "final_x": 259, + "final_y": 212 + }, + { + "color": [ + 53, + 218, + 76 + ], + "shape": "triangle", + "bin_index": 1, + "size": 60, + "initial_x": 928, + "initial_y": 392, + "final_x": 465, + "final_y": 202 + }, + { + "color": [ + 24, + 124, + 171 + ], + "shape": "circle", + "bin_index": 2, + "size": 60, + "initial_x": 235, + "initial_y": 733, + "final_x": 722, + "final_y": 209 + }, + { + "color": [ + 24, + 124, + 171 + ], + "shape": "triangle", + "bin_index": 2, + "size": 60, + "initial_x": 398, + "initial_y": 908, + "final_x": 766, + "final_y": 207 + } + ] + }, + "param_hash": "43047c030e9e972b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/prompt.txt b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bca1f25eba773b54a4e1f5381e252ff7bf1f527 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000001/prompt.txt @@ -0,0 +1 @@ +Move each item into the bin that matches its color. Only move items, do not change anything else. 
\ No newline at end of file diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/final_frame.png b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f1fd5f6dec05524540d7deb28333c462636cd54b Binary files /dev/null and b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/final_frame.png differ diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/first_frame.png b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a868950f5d329c56a6f4fc05957a82ce6a71c577 Binary files /dev/null and b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/first_frame.png differ diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/ground_truth.mp4 b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..08ff19ae54f357aecdfe770b42615f1a47d81982 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038a852859acfc9f05fc9dd0f9fd864ff9fede37ddfafa07d545b5b664e10aa4 +size 165823 diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/metadata.json b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ef85c5f1836bec6b5ee0be7e2d325eaedf1fea82 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/metadata.json @@ -0,0 +1,107 @@ +{ + "task_id": "return_to_correct_bin_00000002", + "generator": "return_to_correct_bin", + "timestamp": "2026-02-17T07:34:51.851421", + "parameters": 
{ + "bins": [ + { + "id": 0, + "color": [ + 190, + 225, + 207 + ], + "x": 256, + "y": 204 + }, + { + "id": 1, + "color": [ + 254, + 177, + 178 + ], + "x": 512, + "y": 204 + }, + { + "id": 2, + "color": [ + 10, + 63, + 60 + ], + "x": 768, + "y": 204 + } + ], + "items": [ + { + "color": [ + 190, + 225, + 207 + ], + "shape": "square", + "bin_index": 0, + "size": 60, + "initial_x": 454, + "initial_y": 871, + "final_x": 209, + "final_y": 202 + }, + { + "color": [ + 254, + 177, + 178 + ], + "shape": "square", + "bin_index": 1, + "size": 60, + "initial_x": 64, + "initial_y": 945, + "final_x": 473, + "final_y": 213 + }, + { + "color": [ + 10, + 63, + 60 + ], + "shape": "square", + "bin_index": 2, + "size": 60, + "initial_x": 864, + "initial_y": 415, + "final_x": 726, + "final_y": 207 + }, + { + "color": [ + 10, + 63, + 60 + ], + "shape": "circle", + "bin_index": 2, + "size": 60, + "initial_x": 778, + "initial_y": 716, + "final_x": 761, + "final_y": 202 + } + ] + }, + "param_hash": "e2642123985356b8", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/prompt.txt b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6bca1f25eba773b54a4e1f5381e252ff7bf1f527 --- /dev/null +++ b/VBVR-Dataset/return_to_correct_bin_task/return_to_correct_bin_00000002/prompt.txt @@ -0,0 +1 @@ +Move each item into the bin that matches its color. Only move items, do not change anything else. 
\ No newline at end of file diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/final_frame.png b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..53f19bba760957679e9241391838f8d9e87502a4 Binary files /dev/null and b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/final_frame.png differ diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/first_frame.png b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f29ee3a8e36723b64e7da780d9247b080768f1eb Binary files /dev/null and b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/first_frame.png differ diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/ground_truth.mp4 b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..96eb552d5658b60831de8a918c4d5350b2066996 --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa6caaaf8e31a61fbc641fd8a01ba9d722a7e4c5ec7d672cafeaf81b0f06416c +size 195725 diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/metadata.json b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..68d899fa0fb78fb845a8b0eab38a1253b421064b --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/metadata.json @@ -0,0 +1,282 @@ +{ + "task_id": "rolling_ball_00000000", + "generator": "rolling_ball", + "timestamp": "2026-02-17T07:48:19.503236", + "parameters": { + "num_platforms": 11, + "trajectory_type": "default", + "objects": [ + { + "symbol": "ball", + "radius": 0.04, + "color": [ + 255, + 80, + 80 + ], + "initial_center_3d": [ + 0.149, + 0.361, + 0.215 + ], + "final_center_3d": [ + 
3.614, + -0.222, + 0.215 + ] + }, + { + "symbol": "platform", + "index": 0, + "position_3d": [ + 0.149, + 0.361, + 0.2 + ], + "direction": [ + 0.465, + -0.885, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 1, + "position_3d": [ + 0.389, + 0.066, + 0.2 + ], + "direction": [ + 0.684, + -0.729, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 2, + "position_3d": [ + 0.729, + -0.088, + 0.2 + ], + "direction": [ + 0.958, + -0.286, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 3, + "position_3d": [ + 1.104, + -0.075, + 0.2 + ], + "direction": [ + 0.989, + 0.147, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 4, + "position_3d": [ + 1.471, + 0.031, + 0.2 + ], + "direction": [ + 0.947, + 0.322, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 5, + "position_3d": [ + 1.833, + 0.156, + 0.2 + ], + "direction": [ + 0.944, + 0.329, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 6, + "position_3d": [ + 2.204, + 0.248, + 0.2 + ], + "direction": [ + 0.978, + 0.208, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 7, + "position_3d": [ + 2.584, + 0.256, + 0.2 + ], + "direction": [ + 0.999, + -0.043, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 8, + "position_3d": [ + 2.95, + 0.156, + 0.2 + ], + "direction": [ + 
0.941, + -0.339, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 9, + "position_3d": [ + 3.286, + -0.024, + 0.2 + ], + "direction": [ + 0.855, + -0.518, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + }, + { + "symbol": "platform", + "index": 10, + "position_3d": [ + 3.614, + -0.222, + 0.2 + ], + "direction": [ + 0.856, + -0.518, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 70, + 130, + 200 + ] + } + ] + }, + "param_hash": "bfcc29e3fbc2dbcd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/prompt.txt b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4af8d2c89c758c5589fc835cd4bf3ea09ca5589c --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a ball and a series of platforms arranged along a curved path. Animate the ball rolling along the trajectory path, smoothly transitioning from one platform to the next, landing on each platform in sequence, and coming to rest on the final platform. 
\ No newline at end of file diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/final_frame.png b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ab102f2a965a56a51148f1e498c92e1a766a0ef4 Binary files /dev/null and b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/final_frame.png differ diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/first_frame.png b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b28132dd9a81dc967c675ec7116920954b51c498 Binary files /dev/null and b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/first_frame.png differ diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/ground_truth.mp4 b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3aa662f62497b027f59034bb312c7e1683929c61 --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2602621ea7e256dee11130134f559dbcf85cbb57cad50cef2f20f59d365984c +size 198269 diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/metadata.json b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f7c4df151199a3d433a5de3a4b5ef49805d198f8 --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/metadata.json @@ -0,0 +1,392 @@ +{ + "task_id": "rolling_ball_00000001", + "generator": "rolling_ball", + "timestamp": "2026-02-17T07:48:20.667443", + "parameters": { + "num_platforms": 16, + "trajectory_type": "complex", + "objects": [ + { + "symbol": "ball", + "radius": 0.04, + "color": [ + 255, + 50, + 50 + ], + "initial_center_3d": [ + 0.104, + 0.286, + 0.215 + ], + "final_center_3d": [ + 
4.485, + 2.44, + 0.215 + ] + }, + { + "symbol": "platform", + "index": 0, + "position_3d": [ + 0.104, + 0.286, + 0.2 + ], + "direction": [ + 0.852, + 0.523, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 1, + "position_3d": [ + 0.393, + 0.454, + 0.2 + ], + "direction": [ + 0.869, + 0.495, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 2, + "position_3d": [ + 0.69, + 0.608, + 0.2 + ], + "direction": [ + 0.896, + 0.444, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 3, + "position_3d": [ + 0.998, + 0.741, + 0.2 + ], + "direction": [ + 0.927, + 0.376, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 4, + "position_3d": [ + 1.314, + 0.849, + 0.2 + ], + "direction": [ + 0.954, + 0.301, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 5, + "position_3d": [ + 1.638, + 0.934, + 0.2 + ], + "direction": [ + 0.973, + 0.232, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 6, + "position_3d": [ + 1.966, + 1.0, + 0.2 + ], + "direction": [ + 0.983, + 0.185, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 7, + "position_3d": [ + 2.296, + 1.059, + 0.2 + ], + "direction": [ + 0.985, + 0.17, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 8, + "position_3d": [ + 2.625, + 1.122, + 0.2 + ], + "direction": [ + 0.98, + 0.198, + 0.0 + 
], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 9, + "position_3d": [ + 2.949, + 1.206, + 0.2 + ], + "direction": [ + 0.962, + 0.273, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 10, + "position_3d": [ + 3.262, + 1.325, + 0.2 + ], + "direction": [ + 0.921, + 0.389, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 11, + "position_3d": [ + 3.554, + 1.487, + 0.2 + ], + "direction": [ + 0.851, + 0.524, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 12, + "position_3d": [ + 3.818, + 1.691, + 0.2 + ], + "direction": [ + 0.763, + 0.646, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 13, + "position_3d": [ + 4.055, + 1.927, + 0.2 + ], + "direction": [ + 0.683, + 0.731, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 14, + "position_3d": [ + 4.272, + 2.182, + 0.2 + ], + "direction": [ + 0.635, + 0.772, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + }, + { + "symbol": "platform", + "index": 15, + "position_3d": [ + 4.485, + 2.44, + 0.2 + ], + "direction": [ + 0.635, + 0.772, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 0, + 191, + 255 + ] + } + ] + }, + "param_hash": "ffecd4bc0d463231", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/prompt.txt 
b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4af8d2c89c758c5589fc835cd4bf3ea09ca5589c --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a ball and a series of platforms arranged along a curved path. Animate the ball rolling along the trajectory path, smoothly transitioning from one platform to the next, landing on each platform in sequence, and coming to rest on the final platform. \ No newline at end of file diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/final_frame.png b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0e4a3d02b91d8a14aabedfa5d85e48514f826051 Binary files /dev/null and b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/final_frame.png differ diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/first_frame.png b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d9f713ef8079844ad3654ad4a432c60939f11e03 Binary files /dev/null and b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/first_frame.png differ diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/ground_truth.mp4 b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4df6b8fef3a755238a88b0d86b5dbb7ec9d50fb9 --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95ca9610dd07d85834269344d07257e8371480a4c39f983813db3a3b0b2782f +size 208516 diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/metadata.json b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..6026db22e8b26c7a722f8cb4200b04c793ba5ecd --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/metadata.json @@ -0,0 +1,260 @@ +{ + "task_id": "rolling_ball_00000002", + "generator": "rolling_ball", + "timestamp": "2026-02-17T07:48:21.673170", + "parameters": { + "num_platforms": 10, + "trajectory_type": "default", + "objects": [ + { + "symbol": "ball", + "radius": 0.04, + "color": [ + 255, + 140, + 0 + ], + "initial_center_3d": [ + 0.238, + 0.405, + 0.215 + ], + "final_center_3d": [ + 3.145, + 1.067, + 0.215 + ] + }, + { + "symbol": "platform", + "index": 0, + "position_3d": [ + 0.238, + 0.405, + 0.2 + ], + "direction": [ + 1.0, + 0.025, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 1, + "position_3d": [ + 0.606, + 0.384, + 0.2 + ], + "direction": [ + 0.996, + -0.087, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 2, + "position_3d": [ + 0.968, + 0.319, + 0.2 + ], + "direction": [ + 0.977, + -0.211, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 3, + "position_3d": [ + 1.325, + 0.228, + 0.2 + ], + "direction": [ + 0.966, + -0.259, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 4, + "position_3d": [ + 1.686, + 0.153, + 0.2 + ], + "direction": [ + 0.983, + -0.183, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 5, + "position_3d": [ + 2.053, + 0.15, + 0.2 + ], + "direction": [ + 0.998, + 0.058, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", 
+ "index": 6, + "position_3d": [ + 2.397, + 0.268, + 0.2 + ], + "direction": [ + 0.909, + 0.416, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 7, + "position_3d": [ + 2.684, + 0.493, + 0.2 + ], + "direction": [ + 0.73, + 0.684, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 8, + "position_3d": [ + 2.921, + 0.775, + 0.2 + ], + "direction": [ + 0.61, + 0.793, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + }, + { + "symbol": "platform", + "index": 9, + "position_3d": [ + 3.145, + 1.067, + 0.2 + ], + "direction": [ + 0.61, + 0.793, + 0.0 + ], + "length": 0.2, + "width": 0.2, + "thickness": 0.03, + "color": [ + 50, + 120, + 240 + ] + } + ] + }, + "param_hash": "aad8ec216cfe4ea5", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/prompt.txt b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4af8d2c89c758c5589fc835cd4bf3ea09ca5589c --- /dev/null +++ b/VBVR-Dataset/rolling_ball_task/rolling_ball_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a ball and a series of platforms arranged along a curved path. Animate the ball rolling along the trajectory path, smoothly transitioning from one platform to the next, landing on each platform in sequence, and coming to rest on the final platform. 
\ No newline at end of file diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/final_frame.png b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f03249c8ef4fa22cfd56765ef85d436b63ce1283 Binary files /dev/null and b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/final_frame.png differ diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/first_frame.png b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..316fccdb484ed5d0499a564fef0dc81d3dd7a125 Binary files /dev/null and b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/first_frame.png differ diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/ground_truth.mp4 b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a8cd9cd6698735f7415ec5c5aa071533c8ef73d0 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a7ee3ffe584720d667b7d8ab0e64ac850d3ffbb70a051a53e6e6bcf20ec50b +size 344516 diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/metadata.json b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..19fb40c6970fd74b05a1b279a646f55efed33017 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/metadata.json @@ -0,0 +1,111 @@ +{ + "task_id": "rotation_puzzle_00000000", + "generator": "rotation_puzzle", + "timestamp": "2026-02-17T07:53:14.047098", + "parameters": { + "difficulty": "medium", + "square_size": 220, + "pipe_color": [ + 14, + 165, + 233 + ], + "num_squares": 4, + "objects": [ + { + "symbol": "square_0", 
+ "index": 0, + "position": [ + 277, + 277 + ], + "center": [ + 387.0, + 387.0 + ], + "pipe_pattern": { + "top": false, + "right": true, + "bottom": true, + "left": false + }, + "initial_angle": 286, + "target_angle": 0, + "rotation_angle": 74 + }, + { + "symbol": "square_1", + "index": 1, + "position": [ + 527, + 277 + ], + "center": [ + 637.0, + 387.0 + ], + "pipe_pattern": { + "top": false, + "right": false, + "bottom": true, + "left": true + }, + "initial_angle": 0, + "target_angle": 0, + "rotation_angle": 0 + }, + { + "symbol": "square_2", + "index": 2, + "position": [ + 277, + 527 + ], + "center": [ + 387.0, + 637.0 + ], + "pipe_pattern": { + "top": true, + "right": true, + "bottom": false, + "left": false + }, + "initial_angle": 332, + "target_angle": 0, + "rotation_angle": 28 + }, + { + "symbol": "square_3", + "index": 3, + "position": [ + 527, + 527 + ], + "center": [ + 637.0, + 637.0 + ], + "pipe_pattern": { + "top": true, + "right": false, + "bottom": false, + "left": true + }, + "initial_angle": 0, + "target_angle": 0, + "rotation_angle": 0 + } + ] + }, + "param_hash": "ffa9316ebe9b2bb6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/prompt.txt b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea5b5a45a8579484cbd8400193e9f5c098e76081 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000000/prompt.txt @@ -0,0 +1 @@ +Solve this rotation puzzle by rotating the four squares to connect the pipe paths. Each square can be rotated 90 degrees clockwise or counterclockwise. Rotate the squares so that all pipe paths connect to form a continuous path. Keep the camera view fixed in the top-down perspective and maintain all square positions unchanged. 
Stop the video when all pipes are connected and the puzzle is solved. \ No newline at end of file diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/final_frame.png b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..01b7e5a6423b10ea826e9b19466311ea4aa1b51b Binary files /dev/null and b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/final_frame.png differ diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/first_frame.png b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..83616b512640b736fde65927e90fce1f1a526c7c Binary files /dev/null and b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/first_frame.png differ diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/ground_truth.mp4 b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c4361e97db55df3240eb91378b41c1cf0feaab31 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40c04e14cbedc19a6ed2b8550cf0eefe9e0dc630a669c52294e333704b3c59a9 +size 372635 diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/metadata.json b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ee83100dafe1a09f71ad0a6b524030e525c87001 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/metadata.json @@ -0,0 +1,111 @@ +{ + "task_id": "rotation_puzzle_00000001", + "generator": "rotation_puzzle", + "timestamp": "2026-02-17T07:53:16.560093", + "parameters": { + "difficulty": "medium", + "square_size": 220, + "pipe_color": [ + 99, + 102, + 
241 + ], + "num_squares": 4, + "objects": [ + { + "symbol": "square_0", + "index": 0, + "position": [ + 277, + 277 + ], + "center": [ + 387.0, + 387.0 + ], + "pipe_pattern": { + "top": false, + "right": true, + "bottom": true, + "left": false + }, + "initial_angle": 202, + "target_angle": 0, + "rotation_angle": 158 + }, + { + "symbol": "square_1", + "index": 1, + "position": [ + 527, + 277 + ], + "center": [ + 637.0, + 387.0 + ], + "pipe_pattern": { + "top": false, + "right": false, + "bottom": true, + "left": true + }, + "initial_angle": 57, + "target_angle": 0, + "rotation_angle": -57 + }, + { + "symbol": "square_2", + "index": 2, + "position": [ + 277, + 527 + ], + "center": [ + 387.0, + 637.0 + ], + "pipe_pattern": { + "top": true, + "right": true, + "bottom": false, + "left": false + }, + "initial_angle": 0, + "target_angle": 0, + "rotation_angle": 0 + }, + { + "symbol": "square_3", + "index": 3, + "position": [ + 527, + 527 + ], + "center": [ + 637.0, + 637.0 + ], + "pipe_pattern": { + "top": true, + "right": false, + "bottom": false, + "left": true + }, + "initial_angle": 327, + "target_angle": 0, + "rotation_angle": 33 + } + ] + }, + "param_hash": "3e7ed4e20a750dd7", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/prompt.txt b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea5b5a45a8579484cbd8400193e9f5c098e76081 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000001/prompt.txt @@ -0,0 +1 @@ +Solve this rotation puzzle by rotating the four squares to connect the pipe paths. Each square can be rotated 90 degrees clockwise or counterclockwise. Rotate the squares so that all pipe paths connect to form a continuous path. 
Keep the camera view fixed in the top-down perspective and maintain all square positions unchanged. Stop the video when all pipes are connected and the puzzle is solved. \ No newline at end of file diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/final_frame.png b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..13f5529299982b30c76fa684ef14b3982d2974b8 Binary files /dev/null and b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/final_frame.png differ diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/first_frame.png b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d68c2e0491418114dd71fe0d95a1c2ff3a0dd37d Binary files /dev/null and b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/first_frame.png differ diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/ground_truth.mp4 b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..24ce8a90ab6c796564fb91a5849bba5805100d1d --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f585d39f73426d68938edd5d5bab3d0077b1846e1ec9d6bae26f3b71f4548019 +size 304242 diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/metadata.json b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..79151fd4fb5828fc77c29888c7a938e63d852e0c --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/metadata.json @@ -0,0 +1,111 @@ +{ + "task_id": "rotation_puzzle_00000002", + "generator": "rotation_puzzle", + "timestamp": "2026-02-17T07:53:18.626999", + 
"parameters": { + "difficulty": "medium", + "square_size": 220, + "pipe_color": [ + 168, + 85, + 247 + ], + "num_squares": 4, + "objects": [ + { + "symbol": "square_0", + "index": 0, + "position": [ + 277, + 277 + ], + "center": [ + 387.0, + 387.0 + ], + "pipe_pattern": { + "top": false, + "right": true, + "bottom": true, + "left": false + }, + "initial_angle": 0, + "target_angle": 0, + "rotation_angle": 0 + }, + { + "symbol": "square_1", + "index": 1, + "position": [ + 527, + 277 + ], + "center": [ + 637.0, + 387.0 + ], + "pipe_pattern": { + "top": false, + "right": false, + "bottom": true, + "left": true + }, + "initial_angle": 311, + "target_angle": 0, + "rotation_angle": 49 + }, + { + "symbol": "square_2", + "index": 2, + "position": [ + 277, + 527 + ], + "center": [ + 387.0, + 637.0 + ], + "pipe_pattern": { + "top": true, + "right": true, + "bottom": false, + "left": false + }, + "initial_angle": 3, + "target_angle": 0, + "rotation_angle": -3 + }, + { + "symbol": "square_3", + "index": 3, + "position": [ + 527, + 527 + ], + "center": [ + 637.0, + 637.0 + ], + "pipe_pattern": { + "top": true, + "right": false, + "bottom": false, + "left": true + }, + "initial_angle": 0, + "target_angle": 0, + "rotation_angle": 0 + } + ] + }, + "param_hash": "aa32094da652cc99", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/prompt.txt b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ea5b5a45a8579484cbd8400193e9f5c098e76081 --- /dev/null +++ b/VBVR-Dataset/rotation_puzzle_task/rotation_puzzle_00000002/prompt.txt @@ -0,0 +1 @@ +Solve this rotation puzzle by rotating the four squares to connect the pipe paths. Each square can be rotated 90 degrees clockwise or counterclockwise. 
Rotate the squares so that all pipe paths connect to form a continuous path. Keep the camera view fixed in the top-down perspective and maintain all square positions unchanged. Stop the video when all pipes are connected and the puzzle is solved. \ No newline at end of file diff --git a/VBVR-Dataset/rotation_task/rotation_00000000/final_frame.png b/VBVR-Dataset/rotation_task/rotation_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..15a07fe22ef36170784f9a38333f689ba04917aa Binary files /dev/null and b/VBVR-Dataset/rotation_task/rotation_00000000/final_frame.png differ diff --git a/VBVR-Dataset/rotation_task/rotation_00000000/first_frame.png b/VBVR-Dataset/rotation_task/rotation_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e234c73aaefdaf80755bdbc9d70c6ce4a49d4226 Binary files /dev/null and b/VBVR-Dataset/rotation_task/rotation_00000000/first_frame.png differ diff --git a/VBVR-Dataset/rotation_task/rotation_00000000/ground_truth.mp4 b/VBVR-Dataset/rotation_task/rotation_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7a5b55777b3844b79c1aad11e65473635af77c85 --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f56b20c20c67f1014340db40c64e176d1a6818dca469c669774c7393b04c93c +size 413888 diff --git a/VBVR-Dataset/rotation_task/rotation_00000000/metadata.json b/VBVR-Dataset/rotation_task/rotation_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..079cd7e321c7fbd360d2cb68d3915fab43fa166f --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000000/metadata.json @@ -0,0 +1,132 @@ +{ + "task_id": "rotation_00000000", + "generator": "rotation", + "timestamp": "2026-02-17T08:00:35.083786", + "parameters": { + "num_voxels": 7, + "rotation_angle": 180, + "initial_view": { + "elevation": 33, + 
"azimuth": 10 + }, + "final_view": { + "elevation": 33, + "azimuth": 190 + }, + "voxel_color": [ + 0.95, + 0.8, + 0.6 + ], + "objects": [ + { + "symbol": "voxel_0", + "index": 0, + "position_3d": [ + 2, + 0, + 2 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + }, + { + "symbol": "voxel_1", + "index": 1, + "position_3d": [ + 1, + 0, + 2 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + }, + { + "symbol": "voxel_2", + "index": 2, + "position_3d": [ + 0, + 0, + 2 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + }, + { + "symbol": "voxel_3", + "index": 3, + "position_3d": [ + 0, + 1, + 2 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + }, + { + "symbol": "voxel_4", + "index": 4, + "position_3d": [ + 0, + 1, + 1 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + }, + { + "symbol": "voxel_5", + "index": 5, + "position_3d": [ + 0, + 1, + 0 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + }, + { + "symbol": "voxel_6", + "index": 6, + "position_3d": [ + 1, + 1, + 0 + ], + "color": [ + 0.95, + 0.8, + 0.6 + ] + } + ] + }, + "param_hash": "cf6b9a01b42989ab", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rotation_task/rotation_00000000/prompt.txt b/VBVR-Dataset/rotation_task/rotation_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..f72f6003d2417412a8e5b5fc7514d1225eec6d11 --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000000/prompt.txt @@ -0,0 +1 @@ +A 7-block sculpture sits fixed on a table. First frame: Your camera is tilted at 33° elevation, viewing from 10° azimuth. Final frame: Your camera remains at 33° elevation, but rotates horizontally to 190° azimuth. This is a 180-degree rotation Create a smooth video showing the camera's horizontal rotation around the sculpture, and try to maintain the tilted viewing angle throughout. 
\ No newline at end of file diff --git a/VBVR-Dataset/rotation_task/rotation_00000001/final_frame.png b/VBVR-Dataset/rotation_task/rotation_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..78a4af1c8580377be77b8195f3a65b23de308168 Binary files /dev/null and b/VBVR-Dataset/rotation_task/rotation_00000001/final_frame.png differ diff --git a/VBVR-Dataset/rotation_task/rotation_00000001/first_frame.png b/VBVR-Dataset/rotation_task/rotation_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fbc2529c1de1cc6563884708b8a4063fa92bbb0c Binary files /dev/null and b/VBVR-Dataset/rotation_task/rotation_00000001/first_frame.png differ diff --git a/VBVR-Dataset/rotation_task/rotation_00000001/ground_truth.mp4 b/VBVR-Dataset/rotation_task/rotation_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4823a92acf1193e1508e89e5b662d8cead58d817 --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0a04c18570fbe78938f095d83109b88537fac79de0b45d871630dfa13002d17 +size 236157 diff --git a/VBVR-Dataset/rotation_task/rotation_00000001/metadata.json b/VBVR-Dataset/rotation_task/rotation_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5f2df576ee4e114dc22cf194d8095c445e784ca3 --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000001/metadata.json @@ -0,0 +1,118 @@ +{ + "task_id": "rotation_00000001", + "generator": "rotation", + "timestamp": "2026-02-17T08:00:38.679930", + "parameters": { + "num_voxels": 6, + "rotation_angle": 180, + "initial_view": { + "elevation": 24, + "azimuth": 190 + }, + "final_view": { + "elevation": 24, + "azimuth": 10 + }, + "voxel_color": [ + 0.85, + 0.55, + 0.55 + ], + "objects": [ + { + "symbol": "voxel_0", + "index": 0, + "position_3d": [ + 0, + 3, + 1 + ], + "color": [ + 0.85, + 0.55, + 
0.55 + ] + }, + { + "symbol": "voxel_1", + "index": 1, + "position_3d": [ + 1, + 3, + 1 + ], + "color": [ + 0.85, + 0.55, + 0.55 + ] + }, + { + "symbol": "voxel_2", + "index": 2, + "position_3d": [ + 1, + 2, + 1 + ], + "color": [ + 0.85, + 0.55, + 0.55 + ] + }, + { + "symbol": "voxel_3", + "index": 3, + "position_3d": [ + 1, + 1, + 1 + ], + "color": [ + 0.85, + 0.55, + 0.55 + ] + }, + { + "symbol": "voxel_4", + "index": 4, + "position_3d": [ + 1, + 0, + 1 + ], + "color": [ + 0.85, + 0.55, + 0.55 + ] + }, + { + "symbol": "voxel_5", + "index": 5, + "position_3d": [ + 1, + 0, + 0 + ], + "color": [ + 0.85, + 0.55, + 0.55 + ] + } + ] + }, + "param_hash": "9622b0ffc28ff87b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rotation_task/rotation_00000001/prompt.txt b/VBVR-Dataset/rotation_task/rotation_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..78ac4551b5d314bfa91293ce7cb22512f9ba0ec2 --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000001/prompt.txt @@ -0,0 +1 @@ +A 6-block sculpture sits fixed on a table. First frame: Your camera is tilted at 24° elevation, viewing from 190° azimuth. Final frame: Your camera remains at 24° elevation, but rotates horizontally to 10° azimuth. This is a 180-degree rotation Create a smooth video showing the camera's horizontal rotation around the sculpture, and try to maintain the tilted viewing angle throughout. 
\ No newline at end of file diff --git a/VBVR-Dataset/rotation_task/rotation_00000002/final_frame.png b/VBVR-Dataset/rotation_task/rotation_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..53399290366a8cf05eb180ad20c50f444b08f5d2 Binary files /dev/null and b/VBVR-Dataset/rotation_task/rotation_00000002/final_frame.png differ diff --git a/VBVR-Dataset/rotation_task/rotation_00000002/first_frame.png b/VBVR-Dataset/rotation_task/rotation_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..191310d886afb2653be6e00383b2601519ae5277 Binary files /dev/null and b/VBVR-Dataset/rotation_task/rotation_00000002/first_frame.png differ diff --git a/VBVR-Dataset/rotation_task/rotation_00000002/ground_truth.mp4 b/VBVR-Dataset/rotation_task/rotation_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..17a748a786f8f4ee4a51a62e95c8a6526e2e7a6c --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcced13f7d10541f7a23edba638deabe290c6ee2b35bfd4fb2b8a43022de5f37 +size 268187 diff --git a/VBVR-Dataset/rotation_task/rotation_00000002/metadata.json b/VBVR-Dataset/rotation_task/rotation_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..39b7e2177e91486b1fe11c462000031620c468dc --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000002/metadata.json @@ -0,0 +1,132 @@ +{ + "task_id": "rotation_00000002", + "generator": "rotation", + "timestamp": "2026-02-17T08:00:42.428533", + "parameters": { + "num_voxels": 7, + "rotation_angle": 180, + "initial_view": { + "elevation": 29, + "azimuth": 70 + }, + "final_view": { + "elevation": 29, + "azimuth": 250 + }, + "voxel_color": [ + 0.5, + 0.65, + 0.9 + ], + "objects": [ + { + "symbol": "voxel_0", + "index": 0, + "position_3d": [ + 0, + 0, + 3 + ], + "color": [ + 0.5, + 0.65, + 0.9 
+ ] + }, + { + "symbol": "voxel_1", + "index": 1, + "position_3d": [ + 0, + 1, + 3 + ], + "color": [ + 0.5, + 0.65, + 0.9 + ] + }, + { + "symbol": "voxel_2", + "index": 2, + "position_3d": [ + 1, + 1, + 3 + ], + "color": [ + 0.5, + 0.65, + 0.9 + ] + }, + { + "symbol": "voxel_3", + "index": 3, + "position_3d": [ + 2, + 1, + 3 + ], + "color": [ + 0.5, + 0.65, + 0.9 + ] + }, + { + "symbol": "voxel_4", + "index": 4, + "position_3d": [ + 2, + 1, + 2 + ], + "color": [ + 0.5, + 0.65, + 0.9 + ] + }, + { + "symbol": "voxel_5", + "index": 5, + "position_3d": [ + 2, + 1, + 1 + ], + "color": [ + 0.5, + 0.65, + 0.9 + ] + }, + { + "symbol": "voxel_6", + "index": 6, + "position_3d": [ + 2, + 1, + 0 + ], + "color": [ + 0.5, + 0.65, + 0.9 + ] + } + ] + }, + "param_hash": "6543e7eaec22dbf1", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/rotation_task/rotation_00000002/prompt.txt b/VBVR-Dataset/rotation_task/rotation_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..865f7e48672b8fa37fe2de18423eab8c0b367282 --- /dev/null +++ b/VBVR-Dataset/rotation_task/rotation_00000002/prompt.txt @@ -0,0 +1 @@ +A 7-block sculpture sits fixed on a table. First frame: Your camera is tilted at 29° elevation, viewing from 70° azimuth. Final frame: Your camera remains at 29° elevation, but rotates horizontally to 250° azimuth. This is a 180-degree rotation Create a smooth video showing the camera's horizontal rotation around the sculpture, and try to maintain the tilted viewing angle throughout. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/final_frame.png b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4e544151ec525b3e4dada147f8879261d8366851 Binary files /dev/null and b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/final_frame.png differ diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/first_frame.png b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1d0e22d3926389fd937737751c55a3655fc23545 Binary files /dev/null and b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/first_frame.png differ diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/ground_truth.mp4 b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a43fb8f47357eabaeb1abc4130654d186530f1f0 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc972f721e05c49582c8f0e054caec6d03c7e415b0436ebd99c1ea6971b298d +size 208057 diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/metadata.json b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..182311e42af644f2ea63fe04799ac33f0061c4cc --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "select_box_with_most_dots_00000000", + 
"generator": "select_box_with_most_dots", + "timestamp": "2026-02-17T06:54:07.914015", + "parameters": { + "boxes": [ + { + "type": "rectangle", + "color": [ + 128, + 0, + 128 + ], + "center": [ + 848.5, + 784.5 + ], + "size": [ + 175.0, + 205.0 + ], + "dot_count": 14 + }, + { + "type": "rectangle", + "color": [ + 255, + 140, + 0 + ], + "center": [ + 419.0, + 296.5 + ], + "size": [ + 300.0, + 205.0 + ], + "dot_count": 13 + }, + { + "type": "rectangle", + "color": [ + 249, + 115, + 22 + ], + "center": [ + 501.0, + 561.5 + ], + "size": [ + 250.0, + 205.0 + ], + "dot_count": 10 + } + ], + "target_index": 0 + }, + "param_hash": "10d89fb5fc50f664", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/prompt.txt b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ea242f8469dd44e9a76f23c74edd977de836903 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000000/prompt.txt @@ -0,0 +1 @@ +There are 3 rectangular boxes on the canvas, each containing some small dots. First count the dots in each box, then circle the single box with the most dots. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/final_frame.png b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1aaf81d2e1784c28121e3f387185d655ac785a6e Binary files /dev/null and b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/final_frame.png differ diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/first_frame.png b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5b10f5438b0620aec360e5805e96f073606bfb55 Binary files /dev/null and b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/first_frame.png differ diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/ground_truth.mp4 b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4404e626d28bb38125bd79d94b835160aea80850 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8bc6b59ff7e810112a0e0f986789fa8e31878cc6f53d2928be132d494fd70e2 +size 206236 diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/metadata.json b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ab8c6b79adcb66e66ebe5bdd934cadd554ff0ceb --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "select_box_with_most_dots_00000001", + 
"generator": "select_box_with_most_dots", + "timestamp": "2026-02-17T06:54:08.598063", + "parameters": { + "boxes": [ + { + "type": "rectangle", + "color": [ + 249, + 115, + 22 + ], + "center": [ + 618.0, + 183.5 + ], + "size": [ + 290.0, + 165.0 + ], + "dot_count": 6 + }, + { + "type": "rectangle", + "color": [ + 75, + 0, + 130 + ], + "center": [ + 268.5, + 601.5 + ], + "size": [ + 275.0, + 195.0 + ], + "dot_count": 15 + }, + { + "type": "rectangle", + "color": [ + 255, + 105, + 180 + ], + "center": [ + 691.5, + 443.0 + ], + "size": [ + 255.0, + 150.0 + ], + "dot_count": 10 + } + ], + "target_index": 1 + }, + "param_hash": "594e2fe734601dfb", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/prompt.txt b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ea242f8469dd44e9a76f23c74edd977de836903 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000001/prompt.txt @@ -0,0 +1 @@ +There are 3 rectangular boxes on the canvas, each containing some small dots. First count the dots in each box, then circle the single box with the most dots. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/final_frame.png b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1361f8e4449b7315ed0a9ca022461a9568ce040d Binary files /dev/null and b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/final_frame.png differ diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/first_frame.png b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8ce0942b0463f86962fb91591c8df0be1d436357 Binary files /dev/null and b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/first_frame.png differ diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/ground_truth.mp4 b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c5cdc1532627406dd275c8b0986c8574053f9ce1 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:406b2f9f69eeee9da453a7035d2195f41f4faf2cdaad5be3495a2cea0ba893cc +size 195996 diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/metadata.json b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..e304f16e2ca8dd48e029f19ba4cd527cbc9395e4 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/metadata.json @@ -0,0 +1,71 @@ +{ + "task_id": "select_box_with_most_dots_00000002", + 
"generator": "select_box_with_most_dots", + "timestamp": "2026-02-17T06:54:09.272607", + "parameters": { + "boxes": [ + { + "type": "rectangle", + "color": [ + 75, + 0, + 130 + ], + "center": [ + 517.0, + 661.0 + ], + "size": [ + 150.0, + 170.0 + ], + "dot_count": 4 + }, + { + "type": "rectangle", + "color": [ + 64, + 224, + 208 + ], + "center": [ + 399.0, + 344.5 + ], + "size": [ + 250.0, + 205.0 + ], + "dot_count": 14 + }, + { + "type": "rectangle", + "color": [ + 99, + 102, + 241 + ], + "center": [ + 870.0, + 270.0 + ], + "size": [ + 180.0, + 250.0 + ], + "dot_count": 8 + } + ], + "target_index": 1 + }, + "param_hash": "3e7db4b192c989d0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/prompt.txt b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6ea242f8469dd44e9a76f23c74edd977de836903 --- /dev/null +++ b/VBVR-Dataset/select_box_with_most_dots_task/select_box_with_most_dots_00000002/prompt.txt @@ -0,0 +1 @@ +There are 3 rectangular boxes on the canvas, each containing some small dots. First count the dots in each box, then circle the single box with the most dots. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/final_frame.png b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..217320403f1cd3714e6e362f66066b7a707eaffc Binary files /dev/null and b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/final_frame.png differ diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/first_frame.png b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c7a17ed8940d3ec92d5d9ecc42d349aaab7ef096 Binary files /dev/null and b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/first_frame.png differ diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/ground_truth.mp4 b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c840d0018cc843b5c13ea2f85903a1ba805178c6 --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d40005ee61c7bcc48f453433b74ff31e902b63f71275d8e8fd0dc6d612a29d +size 182396 diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/metadata.json b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe4ec13239630eea352a2c85c576418e67bd22d --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/metadata.json 
@@ -0,0 +1,59 @@ +{ + "task_id": "select_nearest_2_1_rectangle_00000000", + "generator": "select_nearest_2_1_rectangle", + "timestamp": "2026-02-17T07:05:51.915660", + "parameters": { + "rectangles": [ + { + "width": 84, + "height": 164, + "color": [ + 255, + 105, + 180 + ], + "position": [ + 394, + 370 + ] + }, + { + "width": 200, + "height": 220, + "color": [ + 26, + 188, + 156 + ], + "position": [ + 569, + 407 + ] + }, + { + "width": 201, + "height": 166, + "color": [ + 100, + 149, + 237 + ], + "position": [ + 462, + 767 + ] + } + ], + "closest_rect_index": 0 + }, + "param_hash": "2174ee5e0513a073", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/prompt.txt b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..79a7c9535c3e1f8a4dfa81966cfccad81a22757a --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows several rectangles with different widths and heights. A rectangle matches a 2:1 aspect ratio if its longer side is about twice its shorter side, regardless of orientation. First compare all rectangles and determine which single rectangle is closest to a 2:1 aspect ratio, then draw one red circle around that rectangle. Do not circle any other rectangles. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/final_frame.png b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a0e4e281f92f7cc6eecb4979d51bcc5b2158b662 Binary files /dev/null and b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/final_frame.png differ diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/first_frame.png b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7bc6841dfb899dc13dbc980d5ade397d7f451d15 Binary files /dev/null and b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/first_frame.png differ diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/ground_truth.mp4 b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a701edaae791a1e6a4a2a21972f913e675a211b4 --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0b2c46f4eb93d48d4c065e1edab9a0213fa1aee8974622ae90db0319d89c8da +size 192630 diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/metadata.json b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b27d533c3b19d6b9d1a76743b022df549deb7d26 --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/metadata.json 
@@ -0,0 +1,85 @@ +{ + "task_id": "select_nearest_2_1_rectangle_00000001", + "generator": "select_nearest_2_1_rectangle", + "timestamp": "2026-02-17T07:05:52.422563", + "parameters": { + "rectangles": [ + { + "width": 162, + "height": 122, + "color": [ + 255, + 165, + 0 + ], + "position": [ + 209, + 386 + ] + }, + { + "width": 175, + "height": 214, + "color": [ + 147, + 112, + 219 + ], + "position": [ + 492, + 662 + ] + }, + { + "width": 155, + "height": 117, + "color": [ + 155, + 89, + 182 + ], + "position": [ + 765, + 233 + ] + }, + { + "width": 144, + "height": 175, + "color": [ + 100, + 149, + 237 + ], + "position": [ + 724, + 636 + ] + }, + { + "width": 172, + "height": 84, + "color": [ + 230, + 126, + 34 + ], + "position": [ + 568, + 250 + ] + } + ], + "closest_rect_index": 4 + }, + "param_hash": "36590737a45e63c5", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/prompt.txt b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..79a7c9535c3e1f8a4dfa81966cfccad81a22757a --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows several rectangles with different widths and heights. A rectangle matches a 2:1 aspect ratio if its longer side is about twice its shorter side, regardless of orientation. First compare all rectangles and determine which single rectangle is closest to a 2:1 aspect ratio, then draw one red circle around that rectangle. Do not circle any other rectangles. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/final_frame.png b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c6400772a3096a7f6171e5e4bf2f7da5c1b73fe7 Binary files /dev/null and b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/final_frame.png differ diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/first_frame.png b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..cba52dd4bdc15d773aaa977d8e89d4a262b55002 Binary files /dev/null and b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/first_frame.png differ diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/ground_truth.mp4 b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0098787863920495d83f3a7c27cb0f424b0fbbea --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2906409fe569155ec53149febf6c15621409cb46d088fee9064d5bb56ccb4d70 +size 195177 diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/metadata.json b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0c14e99b4159ef8d86e39c4c30161507d2fc2fce --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/metadata.json 
@@ -0,0 +1,85 @@ +{ + "task_id": "select_nearest_2_1_rectangle_00000002", + "generator": "select_nearest_2_1_rectangle", + "timestamp": "2026-02-17T07:05:52.912562", + "parameters": { + "rectangles": [ + { + "width": 218, + "height": 80, + "color": [ + 52, + 73, + 94 + ], + "position": [ + 689, + 728 + ] + }, + { + "width": 185, + "height": 136, + "color": [ + 255, + 105, + 180 + ], + "position": [ + 147, + 768 + ] + }, + { + "width": 89, + "height": 180, + "color": [ + 26, + 188, + 156 + ], + "position": [ + 427, + 466 + ] + }, + { + "width": 220, + "height": 185, + "color": [ + 255, + 165, + 0 + ], + "position": [ + 400, + 790 + ] + }, + { + "width": 175, + "height": 220, + "color": [ + 50, + 205, + 50 + ], + "position": [ + 153, + 394 + ] + } + ], + "closest_rect_index": 2 + }, + "param_hash": "9ec96f1b549e9c58", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/prompt.txt b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..79a7c9535c3e1f8a4dfa81966cfccad81a22757a --- /dev/null +++ b/VBVR-Dataset/select_nearest_2_1_rectangle_task/select_nearest_2_1_rectangle_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows several rectangles with different widths and heights. A rectangle matches a 2:1 aspect ratio if its longer side is about twice its shorter side, regardless of orientation. First compare all rectangles and determine which single rectangle is closest to a 2:1 aspect ratio, then draw one red circle around that rectangle. Do not circle any other rectangles. Show the complete solution step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/final_frame.png b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c1da3ac3446a98aa1fe8942f0c48d09a708d14d1 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/first_frame.png b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..fa6cbea5808490fedb56444eee8552b5e5302637 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..59dcae84cc1cda82d9042c864eadff57bbaefd4c --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86934f077cf604c297a09b0b477c14bcda28c0b0b452e10cd918a9849b0ce06 +size 189756 diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/metadata.json 
b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6deb883e53ea0a447aff392d337773a4edf16e88 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_decreasing_size_sequence_00000000", + "generator": "select_next_figure_decreasing_size_sequence", + "timestamp": "2026-02-17T06:49:25.609705", + "parameters": { + "sequence": [ + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 155 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 118 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 81 + } + ], + "candidates": [ + { + "shape": "circle", + "color": [ + 138, + 43, + 226 + ], + "size": 44 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 44 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 118 + }, + { + "shape": "diamond", + "color": [ + 199, + 21, + 133 + ], + "size": 44 + } + ], + "correct_index": 1 + }, + "param_hash": "b8fd6292485d7ec3", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/prompt.txt b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f8ed85eed0cc03513bdc6b64f165241d72c9f15 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000000/prompt.txt @@ -0,0 +1 @@ +The scene has two separated 
areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly decrease from left to right. First identify the constant size step between consecutive sequence shapes, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and size-decrease pattern. Circle the correct option and show the full process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/final_frame.png b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..25df3edb224c10146cb9ceb31a556709d5a64e07 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/first_frame.png b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..275cbfc1bb4d9ed57861b745c8e8ece1ebe626d4 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2ca89fe082886f56706da7a365cb6c8be9385220 --- /dev/null +++ 
b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42a3f1f6306bb627822b3349946c7125776f70aea344bd0b5d1b4114ca7308f4 +size 228173 diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/metadata.json b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5823112da112aa01494fd63797c8aef36348ebe5 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_decreasing_size_sequence_00000001", + "generator": "select_next_figure_decreasing_size_sequence", + "timestamp": "2026-02-17T06:49:26.261376", + "parameters": { + "sequence": [ + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 152 + }, + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 129 + }, + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 106 + } + ], + "candidates": [ + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 106 + }, + { + "shape": "diamond", + "color": [ + 165, + 42, + 42 + ], + "size": 83 + }, + { + "shape": "hexagon", + "color": [ + 0, + 170, + 0 + ], + "size": 83 + }, + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 83 + } + ], + "correct_index": 3 + }, + "param_hash": "db88929ec0054727", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/prompt.txt 
b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f8ed85eed0cc03513bdc6b64f165241d72c9f15 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000001/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly decrease from left to right. First identify the constant size step between consecutive sequence shapes, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and size-decrease pattern. Circle the correct option and show the full process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/final_frame.png b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..906d3bd4624d2957ee787853e5a950c9d7f82027 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/first_frame.png b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..eb56921defed06512cd4f47a9de4886863f57546 Binary files /dev/null and 
b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..679a83e17e9f5edfbf18d33871a6f2d9375b1269 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d7eb1b14bf0fef5e59376e8f472756f09b021c1abec003fd61223e692618dc +size 177965 diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/metadata.json b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4eb6b95e043d12c4e2ecee3f0b0270cf8588c95c --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_decreasing_size_sequence_00000002", + "generator": "select_next_figure_decreasing_size_sequence", + "timestamp": "2026-02-17T06:49:26.939275", + "parameters": { + "sequence": [ + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 119 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 95 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 71 + } + ], + "candidates": [ + { + "shape": "square", + "color": [ + 0, + 255, + 200 + ], + "size": 47 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + 
"size": 95 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 47 + }, + { + "shape": "hexagon", + "color": [ + 50, + 205, + 50 + ], + "size": 47 + } + ], + "correct_index": 2 + }, + "param_hash": "924e26ded11c035c", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/prompt.txt b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..5f8ed85eed0cc03513bdc6b64f165241d72c9f15 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_decreasing_size_sequence_task/select_next_figure_decreasing_size_sequence_00000002/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly decrease from left to right. First identify the constant size step between consecutive sequence shapes, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and size-decrease pattern. Circle the correct option and show the full process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/final_frame.png b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..cbe5485bfd0031d9a977935afc5d7154a0d69f01 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/first_frame.png b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..677cb006eceb43aac3eb1be2355016703141722f Binary files /dev/null and b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..8158ff6cdc2031a277f17a67caabd00f67df6f8f --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb0b651f86b3fc18891829ca920acbcf198a89c200631301c03cbf7e7e4d615 +size 254766 diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/metadata.json 
b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bc2eca39771b4eca27ab9bd701a80e6b01ad01ec --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_increasing_size_sequence_00000000", + "generator": "select_next_figure_increasing_size_sequence", + "timestamp": "2026-02-17T06:48:27.927956", + "parameters": { + "sequence": [ + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 58 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 81 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 104 + } + ], + "candidates": [ + { + "shape": "circle", + "color": [ + 138, + 43, + 226 + ], + "size": 127 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 127 + }, + { + "shape": "circle", + "color": [ + 199, + 21, + 133 + ], + "size": 81 + }, + { + "shape": "diamond", + "color": [ + 199, + 21, + 133 + ], + "size": 127 + } + ], + "correct_index": 1 + }, + "param_hash": "ed2d16a5e560c768", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/prompt.txt b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..37a0e42bc4c63b5353f1c06e077d67afada838fe --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000000/prompt.txt @@ -0,0 +1 @@ +The scene has two separated 
areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly increase from left to right. First identify the constant size step between consecutive sequence shapes, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and size-increase pattern. Circle the correct option and show the full process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/final_frame.png b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6bebb5a92c2004a5f3d0e224b5a0a66686051619 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/first_frame.png b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3f11601610731661f62823b96a72ac4128fec2cd Binary files /dev/null and b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..988b276db91ffdc8bc6865ada50bdb7c1826ecc0 --- /dev/null +++ 
b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4a088213c288b13ceedc8238c35aa9305034c6c46b5f74384a790372a702cf +size 261403 diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/metadata.json b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3e1514b67ff9a1cd9580181a8f3ba817c6b77b33 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_increasing_size_sequence_00000001", + "generator": "select_next_figure_increasing_size_sequence", + "timestamp": "2026-02-17T06:48:28.607157", + "parameters": { + "sequence": [ + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 31 + }, + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 70 + }, + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 109 + } + ], + "candidates": [ + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 70 + }, + { + "shape": "diamond", + "color": [ + 165, + 42, + 42 + ], + "size": 148 + }, + { + "shape": "hexagon", + "color": [ + 0, + 170, + 0 + ], + "size": 148 + }, + { + "shape": "diamond", + "color": [ + 0, + 170, + 0 + ], + "size": 148 + } + ], + "correct_index": 3 + }, + "param_hash": "475e76e9b84c343b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/prompt.txt 
b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..37a0e42bc4c63b5353f1c06e077d67afada838fe --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000001/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly increase from left to right. First identify the constant size step between consecutive sequence shapes, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and size-increase pattern. Circle the correct option and show the full process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/final_frame.png b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7cc9ec1c6e3344e3409dfeb5d5432bee7f1ecb6a Binary files /dev/null and b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/first_frame.png b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..770b5ebc668b51dd307995c85b3cf9673f2d518f Binary files /dev/null and 
b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..57cb4009bb37088d5a9affe05eb27365f95fc882 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348f58060354ebff58170276eb01724d3be2f53c9767208ef2db46c861034c58 +size 216170 diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/metadata.json b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9acefef54a77834d089a5cf36622de835e969ef9 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_increasing_size_sequence_00000002", + "generator": "select_next_figure_increasing_size_sequence", + "timestamp": "2026-02-17T06:48:29.276575", + "parameters": { + "sequence": [ + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 33 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 54 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 75 + } + ], + "candidates": [ + { + "shape": "square", + "color": [ + 0, + 255, + 200 + ], + "size": 96 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + 
"size": 54 + }, + { + "shape": "square", + "color": [ + 50, + 205, + 50 + ], + "size": 96 + }, + { + "shape": "hexagon", + "color": [ + 50, + 205, + 50 + ], + "size": 96 + } + ], + "correct_index": 2 + }, + "param_hash": "892e2f5999992ecc", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/prompt.txt b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..37a0e42bc4c63b5353f1c06e077d67afada838fe --- /dev/null +++ b/VBVR-Dataset/select_next_figure_increasing_size_sequence_task/select_next_figure_increasing_size_sequence_00000002/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly increase from left to right. First identify the constant size step between consecutive sequence shapes, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and size-increase pattern. Circle the correct option and show the full process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/final_frame.png b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b99afc12164ed5fce5ece17b2817f49b9ae2273a Binary files /dev/null and b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/first_frame.png b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d6653fc5a37dc5111257c0ce64295de274dbf207 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5045ab1fb7bc7cd5a8abf8185573fa247a5f5a4b --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13fce13d453896c02728b5c82a32279cf9d832c6f841c6f773fff9c727b353b2 +size 223464 diff --git 
a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/metadata.json b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..88ea77e9686de75619c47e1aa50bc08eef275a39 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_large_small_alternating_sequence_00000000", + "generator": "select_next_figure_large_small_alternating_sequence", + "timestamp": "2026-02-17T06:49:51.596573", + "parameters": { + "sequence": [ + { + "shape": "square", + "color": [ + 255, + 193, + 7 + ], + "size": 40 + }, + { + "shape": "square", + "color": [ + 255, + 193, + 7 + ], + "size": 80 + }, + { + "shape": "square", + "color": [ + 255, + 193, + 7 + ], + "size": 40 + } + ], + "candidates": [ + { + "shape": "hexagon", + "color": [ + 255, + 193, + 7 + ], + "size": 80 + }, + { + "shape": "square", + "color": [ + 255, + 193, + 7 + ], + "size": 40 + }, + { + "shape": "square", + "color": [ + 255, + 193, + 7 + ], + "size": 80 + }, + { + "shape": "square", + "color": [ + 35, + 35, + 35 + ], + "size": 80 + } + ], + "correct_index": 2 + }, + "param_hash": "ab575ce3ca686479", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/prompt.txt b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/prompt.txt new file mode 100644 index 
0000000000000000000000000000000000000000..c6441d8ba862bce2a96a6b6cad40cc20eddc22f9 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000000/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly alternate between LARGE and SMALL from left to right. First observe the size-alternation pattern and determine whether the next item should be LARGE or SMALL, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and large/small alternation pattern. Circle the correct option and show the full process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/final_frame.png b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8d68ba7c41439adce4d97e591df8fe98746d2c04 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/first_frame.png b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..691b83dbe9ed177db1e001bf2e66f417a0d72634 Binary files /dev/null and 
b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..1e69c6f4fdc15206b5ee14050685f06db4bce843 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428f348712223df0a306ceb8154c2110b7be254149188de955ad90684a615aa9 +size 236038 diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/metadata.json b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..89e7906bd2ab2a607a7bd3e23d91ad4164bb2306 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_large_small_alternating_sequence_00000001", + "generator": "select_next_figure_large_small_alternating_sequence", + "timestamp": "2026-02-17T06:49:52.317110", + "parameters": { + "sequence": [ + { + "shape": "circle", + "color": [ + 203, + 75, + 22 + ], + "size": 50 + }, + { + "shape": "circle", + "color": [ + 203, + 75, + 22 + ], + "size": 120 + }, + { + "shape": "circle", + "color": [ + 203, + 75, + 22 + ], + "size": 50 + } + ], + "candidates": [ + { + "shape": 
"circle", + "color": [ + 203, + 75, + 22 + ], + "size": 50 + }, + { + "shape": "circle", + "color": [ + 35, + 35, + 35 + ], + "size": 120 + }, + { + "shape": "pentagon", + "color": [ + 203, + 75, + 22 + ], + "size": 120 + }, + { + "shape": "circle", + "color": [ + 203, + 75, + 22 + ], + "size": 120 + } + ], + "correct_index": 3 + }, + "param_hash": "3b7e9e8d7af4d204", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/prompt.txt b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c6441d8ba862bce2a96a6b6cad40cc20eddc22f9 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000001/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly alternate between LARGE and SMALL from left to right. First observe the size-alternation pattern and determine whether the next item should be LARGE or SMALL, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and large/small alternation pattern. Circle the correct option and show the full process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/final_frame.png b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..591f30e5a00ff24e28b970446ee1e2b7d8b52d0b Binary files /dev/null and b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/final_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/first_frame.png b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5c19ab563ec5763d373c697171def10920e5c550 Binary files /dev/null and b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/first_frame.png differ diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/ground_truth.mp4 b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..d1f0de5161425021fbd9c5ed45985e437a26369a --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02ca93648871a8801feece264cf66bf18651a83ae0d419eb05b540f02963734 +size 242661 diff --git 
a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/metadata.json b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b74ad1e156c9f4c992f5a88bb7d1123187474082 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "select_next_figure_large_small_alternating_sequence_00000002", + "generator": "select_next_figure_large_small_alternating_sequence", + "timestamp": "2026-02-17T06:49:52.900058", + "parameters": { + "sequence": [ + { + "shape": "circle", + "color": [ + 0, + 128, + 128 + ], + "size": 130 + }, + { + "shape": "circle", + "color": [ + 0, + 128, + 128 + ], + "size": 50 + }, + { + "shape": "circle", + "color": [ + 0, + 128, + 128 + ], + "size": 130 + } + ], + "candidates": [ + { + "shape": "circle", + "color": [ + 0, + 128, + 128 + ], + "size": 50 + }, + { + "shape": "pentagon", + "color": [ + 0, + 128, + 128 + ], + "size": 50 + }, + { + "shape": "circle", + "color": [ + 0, + 128, + 128 + ], + "size": 130 + }, + { + "shape": "circle", + "color": [ + 211, + 54, + 130 + ], + "size": 50 + } + ], + "correct_index": 0 + }, + "param_hash": "df07f59828e1344f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/prompt.txt b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/prompt.txt new file mode 100644 index 
0000000000000000000000000000000000000000..c6441d8ba862bce2a96a6b6cad40cc20eddc22f9 --- /dev/null +++ b/VBVR-Dataset/select_next_figure_large_small_alternating_sequence_task/select_next_figure_large_small_alternating_sequence_00000002/prompt.txt @@ -0,0 +1 @@ +The scene has two separated areas: a top SEQUENCE area and a bottom CHOICES area. In the SEQUENCE area, the shapes are the same shape and the same color, and their sizes strictly alternate between LARGE and SMALL from left to right. First observe the size-alternation pattern and determine whether the next item should be LARGE or SMALL, then select the one correct option (out of 4) in the CHOICES area that continues the same shape, color, and large/small alternation pattern. Circle the correct option and show the full process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/final_frame.png b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..cba9b114e90a4139f27b230ba7667f03a8906e4b Binary files /dev/null and b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/final_frame.png differ diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/first_frame.png b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..517985e5d0a77294f6759a72351931322ebc6d13 Binary files /dev/null and b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/first_frame.png differ diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/ground_truth.mp4 b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..4966b171d38ec19863fd2b2625d25cd814695434 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6c1fb1226e117bf85b4607d82e498e9692dcef24556631132556dc84fe06ae +size 256456 diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/metadata.json b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..522934380a89c1bc48181748a9d41d13046f7000 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "seperate_object_spinning_00000000", + "generator": "seperate_object_spinning", + "timestamp": "2026-02-17T07:17:44.520952", + "parameters": { + "objects": [ + { + "id": 0, + "shape": "triangle", + "color": [ + 255, + 100, + 100 + ], + "size": 140, + "start_angle": 3, + "end_angle": -3, + "start_center": [ + 189.154745, + 532.809435 + ], + "end_center": [ + 675.708349, + 532.809435 + ] + }, + { + "id": 1, + "shape": "diamond", + "color": [ + 200, + 140, + 220 + ], + "size": 65, + "start_angle": -18, + "end_angle": 15, + "start_center": [ + 390.581341, + 532.809435 + ], + "end_center": [ + 866.740913, + 532.809435 + ] + }, + { + "id": 2, + "shape": "hexagon", + "color": [ + 128, + 0, + 128 + ], + "size": 58, + "start_angle": 15, + "end_angle": 7, + "start_center": [ + 379.395827, + 408.950107 + ], + "end_center": [ + 866.740913, + 408.950107 + ] + } + ] + }, + "param_hash": "5af9e7c96c5c852b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/prompt.txt 
b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ac70fe50c054bcec56e7a7469fa08935fdb4c32 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 objects on the left side and dashed target outlines on the right side. The dashed target outlines remain completely stationary. For each object, first rotate it in place to match the orientation of its corresponding dashed target outline, then move it horizontally to the right so that it aligns exactly with and fits within its corresponding dashed target outline. \ No newline at end of file diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/final_frame.png b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..642bd4d36b6a4d083fc0175df9c70e9230495230 Binary files /dev/null and b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/final_frame.png differ diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/first_frame.png b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..38bbcf284913850dbf7bad4c90b88182d5b89142 Binary files /dev/null and b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/first_frame.png differ diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/ground_truth.mp4 b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b106156c7b17edd5a8f190490a1055ed899866a8 --- /dev/null +++ 
b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49fbab40dee2b8e25e83b08fd8ee479f31be1b669a21ae3fccbb415c71dbeb83 +size 309423 diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/metadata.json b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..934fa085d09ea9687297b30d6a29d7b1b1036927 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/metadata.json @@ -0,0 +1,99 @@ +{ + "task_id": "seperate_object_spinning_00000001", + "generator": "seperate_object_spinning", + "timestamp": "2026-02-17T07:17:45.361222", + "parameters": { + "objects": [ + { + "id": 0, + "shape": "circle", + "color": [ + 230, + 170, + 95 + ], + "size": 84, + "start_angle": 0, + "end_angle": 0, + "start_center": [ + 157.266869, + 560.028143 + ], + "end_center": [ + 637.339269, + 560.028143 + ] + }, + { + "id": 1, + "shape": "hexagon", + "color": [ + 255, + 150, + 50 + ], + "size": 98, + "start_angle": 16, + "end_angle": -15, + "start_center": [ + 346.429795, + 560.028143 + ], + "end_center": [ + 826.0, + 560.028143 + ] + }, + { + "id": 2, + "shape": "circle", + "color": [ + 120, + 175, + 235 + ], + "size": 81, + "start_angle": 0, + "end_angle": 0, + "start_center": [ + 198.528094, + 374.367412 + ], + "end_center": [ + 826.0, + 374.367412 + ] + }, + { + "id": 3, + "shape": "diamond", + "color": [ + 255, + 228, + 196 + ], + "size": 50, + "start_angle": 4, + "end_angle": -5, + "start_center": [ + 167.108657, + 692.330365 + ], + "end_center": [ + 637.339269, + 692.330365 + ] + } + ] + }, + "param_hash": "5770a6ea359cd791", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git 
a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/prompt.txt b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2d9b03c162b4d15bf95f1c7370a0c41e4f6a64a5 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 objects on the left side and dashed target outlines on the right side. The dashed target outlines remain completely stationary. For each object, first rotate it in place to match the orientation of its corresponding dashed target outline, then move it horizontally to the right so that it aligns exactly with and fits within its corresponding dashed target outline. \ No newline at end of file diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/final_frame.png b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6ec8ca49968a180d3416ead789fb0789e7013c4d Binary files /dev/null and b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/final_frame.png differ diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/first_frame.png b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6ff513df93cc0839247d4425906eb5cddbb8b8a6 Binary files /dev/null and b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/first_frame.png differ diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/ground_truth.mp4 b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..96ce8404bcd137441ed7b0378f47e1a4acaa88a7 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfd2ba7975ddd7e34c547d9c885bbff0926df51da4272c4d3081eafda63f067 +size 308615 diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/metadata.json b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..b5e5396ba4e7f07ab9d61f6f2b95b3521e3802cf --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/metadata.json @@ -0,0 +1,79 @@ +{ + "task_id": "seperate_object_spinning_00000002", + "generator": "seperate_object_spinning", + "timestamp": "2026-02-17T07:17:45.946128", + "parameters": { + "objects": [ + { + "id": 0, + "shape": "circle", + "color": [ + 255, + 165, + 0 + ], + "size": 64, + "start_angle": 0, + "end_angle": 0, + "start_center": [ + 373.953307, + 610.0 + ], + "end_center": [ + 620.547454, + 610.0 + ] + }, + { + "id": 1, + "shape": "circle", + "color": [ + 100, + 150, + 200 + ], + "size": 93, + "start_angle": 0, + "end_angle": 0, + "start_center": [ + 318.812511, + 395.547454 + ], + "end_center": [ + 806.0, + 395.547454 + ] + }, + { + "id": 2, + "shape": "diamond", + "color": [ + 80, + 255, + 120 + ], + "size": 122, + "start_angle": 1, + "end_angle": 21, + "start_center": [ + 203.847826, + 610.0 + ], + "end_center": [ + 806.0, + 610.0 + ] + } + ] + }, + "param_hash": "403fa0d4dbda69f2", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/prompt.txt 
b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..7ac70fe50c054bcec56e7a7469fa08935fdb4c32 --- /dev/null +++ b/VBVR-Dataset/seperate_object_spinning_task/seperate_object_spinning_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 objects on the left side and dashed target outlines on the right side. The dashed target outlines remain completely stationary. For each object, first rotate it in place to match the orientation of its corresponding dashed target outline, then move it horizontally to the right so that it aligns exactly with and fits within its corresponding dashed target outline. \ No newline at end of file diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/final_frame.png b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..64d02081ea2ee6da690c3daf0e4aefadc44b061d Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/final_frame.png differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/first_frame.png b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9a4e88e027e9d33e1d51d3e376847acfdcccae53 Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/first_frame.png differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/ground_truth.mp4 b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..635b7d528d3fed8a3edd9b5932a732e5a45247d5 Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/ground_truth.mp4 differ diff --git 
a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/metadata.json b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..82a57432471bb853c51542fa551c5fe13c02020e --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/metadata.json @@ -0,0 +1,116 @@ +{ + "task_id": "sequence_completion_00000000", + "generator": "sequence_completion", + "timestamp": "2026-02-17T07:54:49.061701", + "parameters": { + "task_type": "mixed", + "task_type_id": 8, + "sequence_length": 6, + "answer_index": 5, + "task_params": { + "cycle": [ + "red△", + "blue○", + "green◇" + ], + "length": 6, + "mixed_type": "color_shape" + }, + "objects": [ + { + "symbol": "element_0", + "index": 0, + "position": 0, + "center": [ + 146.29, + 512.0 + ], + "type": "mixed", + "value": "red△", + "is_answer": false, + "shape": "△", + "color": "red" + }, + { + "symbol": "element_1", + "index": 1, + "position": 1, + "center": [ + 292.57, + 512.0 + ], + "type": "mixed", + "value": "blue○", + "is_answer": false, + "shape": "○", + "color": "blue" + }, + { + "symbol": "element_2", + "index": 2, + "position": 2, + "center": [ + 438.86, + 512.0 + ], + "type": "mixed", + "value": "green◇", + "is_answer": false, + "shape": "◇", + "color": "green" + }, + { + "symbol": "element_3", + "index": 3, + "position": 3, + "center": [ + 585.14, + 512.0 + ], + "type": "mixed", + "value": "red△", + "is_answer": false, + "shape": "△", + "color": "red" + }, + { + "symbol": "element_4", + "index": 4, + "position": 4, + "center": [ + 731.43, + 512.0 + ], + "type": "mixed", + "value": "blue○", + "is_answer": false, + "shape": "○", + "color": "blue" + }, + { + "symbol": "element_5", + "index": 5, + "position": 5, + "center": [ + 877.71, + 512.0 + ], + "type": "mixed", + "value": "green◇", + "is_answer": true, + "shape": "◇", + "color": "green" + } + ] + }, + "param_hash": "116522b6602549d7", + 
"generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/prompt.txt b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fcee6cfcd641094d78f0ace7eaa8cf189513cecc --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a mixed sequence. Elements are arranged horizontally from left to right. The last position contains a question mark (?) indicating a missing element. Observe the pattern: both colors and shapes follow combined cyclic orders. Determine the element that should replace the question mark to complete the sequence according to the established pattern. \ No newline at end of file diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/final_frame.png b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..42c2b38a970ff8d70c3dec8a37444c0ac64330b2 Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/final_frame.png differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/first_frame.png b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8b7c325aff2f35e38bb117840e261c800cd98d8e Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/first_frame.png differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/ground_truth.mp4 b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..94dff38c4906169c64120a2ae42ca92eb231e82a --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408e4080b3a528ea66f67a1fda68cb9952f4b72ae1e70bf999944e335a866e32 +size 141105 diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/metadata.json b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..69ce27fd068ddd891cd5f86e034f5d6e0178132b --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/metadata.json @@ -0,0 +1,112 @@ +{ + "task_id": "sequence_completion_00000001", + "generator": "sequence_completion", + "timestamp": "2026-02-17T07:54:50.004092", + "parameters": { + "task_type": "fibonacci", + "task_type_id": 4, + "sequence_length": 7, + "answer_index": 6, + "task_params": { + "first": 5, + "second": 4, + "length": 7 + }, + "objects": [ + { + "symbol": "element_0", + "index": 0, + "position": 0, + "center": [ + 128.0, + 512.0 + ], + "type": "number", + "value": 5, + "is_answer": false + }, + { + "symbol": "element_1", + "index": 1, + "position": 1, + "center": [ + 256.0, + 512.0 + ], + "type": "number", + "value": 4, + "is_answer": false + }, + { + "symbol": "element_2", + "index": 2, + "position": 2, + "center": [ + 384.0, + 512.0 + ], + "type": "number", + "value": 9, + "is_answer": false + }, + { + "symbol": "element_3", + "index": 3, + "position": 3, + "center": [ + 512.0, + 512.0 + ], + "type": "number", + "value": 13, + "is_answer": false + }, + { + "symbol": "element_4", + "index": 4, + "position": 4, + "center": [ + 640.0, + 512.0 + ], + "type": "number", + "value": 22, + "is_answer": false + }, + { + "symbol": "element_5", + "index": 5, + "position": 5, + "center": [ + 768.0, + 512.0 + ], + "type": "number", + "value": 35, + "is_answer": 
false + }, + { + "symbol": "element_6", + "index": 6, + "position": 6, + "center": [ + 896.0, + 512.0 + ], + "type": "number", + "value": 57, + "is_answer": true + } + ] + }, + "param_hash": "dfbdc208dab37044", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/prompt.txt b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6790155cb041378d90fccf0550220953b4b30bc8 --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a fibonacci sequence. Elements are arranged horizontally from left to right. The last position contains a question mark (?) indicating a missing element. Observe the pattern: each number is the sum of the two immediately preceding numbers. Determine the element that should replace the question mark to complete the sequence according to the established pattern. 
\ No newline at end of file diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/final_frame.png b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..654835b6b5101abc93add045c12cee6004edabed Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/final_frame.png differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/first_frame.png b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..067a155d4dd292213fc8371ea265b127e9eb15a2 Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/first_frame.png differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/ground_truth.mp4 b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..66d0e84cc3cb5efc4bb978263369fdd7816905bc Binary files /dev/null and b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/metadata.json b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6fc71cf178d483ce8a8218402798fef77bae545a --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/metadata.json @@ -0,0 +1,174 @@ +{ + "task_id": "sequence_completion_00000000", + "generator": "sequence_completion", + "timestamp": "2026-02-19T02:36:41.021838", + "parameters": { + "task_type": "color_cycle", + "task_type_id": 6, + "sequence_length": 6, + "answer_index": 5, + "task_params": { + "cycle": [ + [ + 152, + 251, + 152 + ], + [ + 173, + 216, + 230 + 
], + [ + 188, + 143, + 143 + ], + [ + 210, + 105, + 30 + ] + ], + "length": 6 + }, + "objects": [ + { + "symbol": "element_0", + "index": 0, + "position": 0, + "center": [ + 146.29, + 512.0 + ], + "type": "color", + "value": [ + 152, + 251, + 152 + ], + "is_answer": false, + "color": [ + 152, + 251, + 152 + ] + }, + { + "symbol": "element_1", + "index": 1, + "position": 1, + "center": [ + 292.57, + 512.0 + ], + "type": "color", + "value": [ + 173, + 216, + 230 + ], + "is_answer": false, + "color": [ + 173, + 216, + 230 + ] + }, + { + "symbol": "element_2", + "index": 2, + "position": 2, + "center": [ + 438.86, + 512.0 + ], + "type": "color", + "value": [ + 188, + 143, + 143 + ], + "is_answer": false, + "color": [ + 188, + 143, + 143 + ] + }, + { + "symbol": "element_3", + "index": 3, + "position": 3, + "center": [ + 585.14, + 512.0 + ], + "type": "color", + "value": [ + 210, + 105, + 30 + ], + "is_answer": false, + "color": [ + 210, + 105, + 30 + ] + }, + { + "symbol": "element_4", + "index": 4, + "position": 4, + "center": [ + 731.43, + 512.0 + ], + "type": "color", + "value": [ + 152, + 251, + 152 + ], + "is_answer": false, + "color": [ + 152, + 251, + 152 + ] + }, + { + "symbol": "element_5", + "index": 5, + "position": 5, + "center": [ + 877.71, + 512.0 + ], + "type": "color", + "value": [ + 173, + 216, + 230 + ], + "is_answer": true, + "color": [ + 173, + 216, + 230 + ] + } + ] + }, + "param_hash": "81ffe815057bc43f", + "generation": { + "seed": 2033916483, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/prompt.txt b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..83f0c51b34df3007d70e22fa773b173e0cf9e98f --- /dev/null +++ b/VBVR-Dataset/sequence_completion_task/sequence_completion_00000002/prompt.txt @@ -0,0 +1 @@ 
+The scene shows a color_cycle sequence. Elements are arranged horizontally from left to right. The last position contains a question mark (?) indicating a missing element. Observe the pattern: the colors follow a cyclic order that repeats after a certain number of elements. Determine the element that should replace the question mark to complete the sequence according to the established pattern. \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/final_frame.png b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..56f8f52953c04517661856ee9d5c0cbb74027afc Binary files /dev/null and b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/final_frame.png differ diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/first_frame.png b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b389042a20f6003f81566907ec92044d06b1252c Binary files /dev/null and b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/first_frame.png differ diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/ground_truth.mp4 b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..db86e471c515077ee6e2360f433d679c1c1833b8 --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ed90abeab97b988df05af67a751c7989a5e2b87a61079cded877c537055010 +size 132218 diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/metadata.json b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..be89f3945277d58f9968afaf2da3143c2d8a9306 --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "shape_color_change_00000000", + "generator": "shape_color_change", + "timestamp": "2026-02-17T08:07:55.002186", + "parameters": { + "transformation_type": "color_change", + "source_color": [ + 153, + 7, + 7 + ], + "target_color": [ + 70, + 130, + 180 + ], + "objects": [ + { + "symbol": "rectangle", + "center": [ + 255, + 256 + ], + "color": [ + 153, + 7, + 7 + ] + }, + { + "symbol": "rectangle", + "center": [ + 769, + 256 + ], + "color": [ + 70, + 130, + 180 + ] + }, + { + "symbol": "minus", + "center": [ + 255, + 768 + ], + "color": [ + 153, + 7, + 7 + ] + }, + { + "symbol": "minus", + "center": [ + 769, + 768 + ], + "color": [ + 70, + 130, + 180 + ] + } + ] + }, + "param_hash": "2c47e8d0463f609b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/prompt.txt b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..e2e7966e9ff685e4f70c32c8b626a4d9c3e5ea70 --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A:B :: C:? with two rows of shapes and arrows. On the top row, a unknown rectangle becomes a steel_blue rectangle; treat this as the color rule from unknown to steel_blue. On the bottom row, the minus starts with the same source color. Apply the same color change so the answer shape on the right is a steel_blue minus, keeping its shape, size, and position the same while only the color changes. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/final_frame.png b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3d4dec70142f11a8121f87c2c61249e75132316b Binary files /dev/null and b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/final_frame.png differ diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/first_frame.png b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7472fabb917e50b45152397d6164ac7598d2aa7f Binary files /dev/null and b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/first_frame.png differ diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/ground_truth.mp4 b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b1de912bcfc5a40b3788af2049909cefd8f85a94 --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b2c4c90a1a2c3b25ad986085ee51ba1ef918250ca28f40a0cb7727e276ffdb +size 139273 diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/metadata.json b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9932e61fd8e73d13d26f1791bcc4762f61874707 --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "shape_color_change_00000001", + "generator": "shape_color_change", + "timestamp": "2026-02-17T08:07:55.661386", + "parameters": { + "transformation_type": "color_change", + "source_color": [ + 168, + 45, + 
229 + ], + "target_color": [ + 114, + 191, + 38 + ], + "objects": [ + { + "symbol": "minus", + "center": [ + 255, + 256 + ], + "color": [ + 168, + 45, + 229 + ] + }, + { + "symbol": "minus", + "center": [ + 769, + 256 + ], + "color": [ + 114, + 191, + 38 + ] + }, + { + "symbol": "cross", + "center": [ + 255, + 768 + ], + "color": [ + 168, + 45, + 229 + ] + }, + { + "symbol": "cross", + "center": [ + 769, + 768 + ], + "color": [ + 114, + 191, + 38 + ] + } + ] + }, + "param_hash": "7d512e1b24c90a63", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/prompt.txt b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb00d11ed8e8fe11a8bcd10a542dfb7b77d9597b --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A:B :: C:? with two rows of shapes and arrows. On the top row, a unknown minus becomes a unknown minus; treat this as the color rule from unknown to unknown. On the bottom row, the cross starts with the same source color. Apply the same color change so the answer shape on the right is a unknown cross, keeping its shape, size, and position the same while only the color changes. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/final_frame.png b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..07fa8d5ba668804fe24045cc5324fdc69087ed65 Binary files /dev/null and b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/final_frame.png differ diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/first_frame.png b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6d6a9429b9244c2b235e4091ae681f1e8637f4ee Binary files /dev/null and b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/first_frame.png differ diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/ground_truth.mp4 b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..509923cbc068967fefab2cfbd8fcd2590ccce5bb --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cdcd612a1d2174721455e4ecb8c30bcce3582c2f6285354e1ffb233c8dfe0c3 +size 185187 diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/metadata.json b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7511c769b2561d88388f3bc9dbf025895177e885 --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "shape_color_change_00000002", + "generator": "shape_color_change", + "timestamp": "2026-02-17T08:07:56.337961", + "parameters": { + "transformation_type": "color_change", + "source_color": [ + 191, + 100, + 
9 + ], + "target_color": [ + 80, + 229, + 105 + ], + "objects": [ + { + "symbol": "octagon", + "center": [ + 255, + 256 + ], + "color": [ + 191, + 100, + 9 + ] + }, + { + "symbol": "octagon", + "center": [ + 769, + 256 + ], + "color": [ + 80, + 229, + 105 + ] + }, + { + "symbol": "arrow", + "center": [ + 255, + 768 + ], + "color": [ + 191, + 100, + 9 + ] + }, + { + "symbol": "arrow", + "center": [ + 769, + 768 + ], + "color": [ + 80, + 229, + 105 + ] + } + ] + }, + "param_hash": "5cfb3192690e0f88", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/prompt.txt b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0cbe33a7fd147cb13393becee24634f02481ca0b --- /dev/null +++ b/VBVR-Dataset/shape_color_change_task/shape_color_change_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A:B :: C:? with two rows of shapes and arrows. On the top row, a unknown octagon becomes a unknown octagon; treat this as the color rule from unknown to unknown. On the bottom row, the arrow starts with the same source color. Apply the same color change so the answer shape on the right is a unknown arrow, keeping its shape, size, and position the same while only the color changes. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/final_frame.png b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..aaaf4f59dd3b782acabaa3bef8d97f5688ce7bb2 Binary files /dev/null and b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/final_frame.png differ diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/first_frame.png b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..013f351d490201d74354f7ec515eb3455a70b2a5 Binary files /dev/null and b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/first_frame.png differ diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/ground_truth.mp4 b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..940f0936ad4383fd23b21a2202be26294935ab36 --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f9dca2e2d58e91ba9b4476edb03af5cd1b891f01c062a4a05d4f28306974cd +size 173028 diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/metadata.json b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..18d51028c511bc88770a5cdcf07763722d0159ac --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/metadata.json @@ -0,0 +1,102 @@ +{ + "task_id": "shape_color_then_scale_00000000", + "generator": "shape_color_then_scale", + "timestamp": 
"2026-02-17T07:37:25.565263", + "parameters": { + "transformation_type": "color_then_scale", + "color_from": "color_042", + "color_to": "color_073", + "scale_from": "extra_large", + "scale_to": "large", + "objects": [ + { + "symbol": "rectangle", + "center": [ + 180, + 341 + ], + "color": [ + 229, + 114, + 114 + ], + "scale": 1.8 + }, + { + "symbol": "rectangle", + "center": [ + 518, + 341 + ], + "color": [ + 153, + 56, + 7 + ], + "scale": 1.8 + }, + { + "symbol": "rectangle", + "center": [ + 856, + 341 + ], + "color": [ + 153, + 56, + 7 + ], + "scale": 1.4 + }, + { + "symbol": "minus", + "center": [ + 180, + 682 + ], + "color": [ + 229, + 114, + 114 + ], + "scale": 1.8 + }, + { + "symbol": "minus", + "center": [ + 518, + 682 + ], + "color": [ + 153, + 56, + 7 + ], + "scale": 1.8 + }, + { + "symbol": "minus", + "center": [ + 856, + 682 + ], + "color": [ + 153, + 56, + 7 + ], + "scale": 1.4 + } + ] + }, + "param_hash": "0a4f580e8d123526", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/prompt.txt b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..a408b5ef7e0a053797525dd5ad0afb3cf8155dc8 --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A→B→C :: D→?→? with two rows of shapes. Top row: color_042 rectangle at extra_large becomes color_073 rectangle at extra_large, then color_073 rectangle at large. This shows two rules: first change color from color_042 to color_073, then change size from extra_large to large. Bottom row: minus starts with color_042 and extra_large. Apply the same transformation: first change color to color_073, then change size to large. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/final_frame.png b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5b9e402dce93c8a33369cc42817e50853a96ad66 Binary files /dev/null and b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/final_frame.png differ diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/first_frame.png b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6386e0d6e6b5f5a8c3a0bc3d4224b1bd15948115 Binary files /dev/null and b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/first_frame.png differ diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/ground_truth.mp4 b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..fc21f7790159f43e6eeda21d0d13d1190c5a1baf --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6bce55b5181fd97d805cbcdb79404eb40f66d4ce9952cbc47636e3727f8c194 +size 190261 diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/metadata.json b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..c192e07890f444620125588db8460efce047da6e --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/metadata.json @@ -0,0 +1,102 @@ +{ + "task_id": "shape_color_then_scale_00000001", + "generator": "shape_color_then_scale", + "timestamp": 
"2026-02-17T07:37:26.232259", + "parameters": { + "transformation_type": "color_then_scale", + "color_from": "color_283", + "color_to": "color_090", + "scale_from": "extra_large", + "scale_to": "small", + "objects": [ + { + "symbol": "circle", + "center": [ + 180, + 341 + ], + "color": [ + 53, + 119, + 153 + ], + "scale": 1.8 + }, + { + "symbol": "circle", + "center": [ + 518, + 341 + ], + "color": [ + 229, + 191, + 114 + ], + "scale": 1.8 + }, + { + "symbol": "circle", + "center": [ + 856, + 341 + ], + "color": [ + 229, + 191, + 114 + ], + "scale": 0.7 + }, + { + "symbol": "minus", + "center": [ + 180, + 682 + ], + "color": [ + 53, + 119, + 153 + ], + "scale": 1.8 + }, + { + "symbol": "minus", + "center": [ + 518, + 682 + ], + "color": [ + 229, + 191, + 114 + ], + "scale": 1.8 + }, + { + "symbol": "minus", + "center": [ + 856, + 682 + ], + "color": [ + 229, + 191, + 114 + ], + "scale": 0.7 + } + ] + }, + "param_hash": "5ed8b3d95423e754", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/prompt.txt b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d48d7f8d6bcfca38a98fd2fe3eaf599f4f9db7a --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A→B→C :: D→?→? with two rows of shapes. Top row: color_283 circle at extra_large becomes color_090 circle at extra_large, then color_090 circle at small. This shows two rules: first change color from color_283 to color_090, then change size from extra_large to small. Bottom row: minus starts with color_283 and extra_large. Apply the same transformation: first change color to color_090, then change size to small. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/final_frame.png b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c1038caa624821795bf164e8838aeb27c6208560 Binary files /dev/null and b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/final_frame.png differ diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/first_frame.png b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1b6d2c7bb665f8cd9d4bf9615f4bae39b57ae23b Binary files /dev/null and b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/first_frame.png differ diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/ground_truth.mp4 b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3a75c9fd9a38a92feeaa427566a16e63bf75307d --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e60d5ced7376f6ed331a245b6571b7318a4b9f82e401050d2e8ce311dbe54e +size 166548 diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/metadata.json b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f78f748e23381646b33be4a930e726cce21ebaa4 --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/metadata.json @@ -0,0 +1,102 @@ +{ + "task_id": "shape_color_then_scale_00000002", + "generator": "shape_color_then_scale", + "timestamp": 
"2026-02-17T07:37:26.918051", + "parameters": { + "transformation_type": "color_then_scale", + "color_from": "color_194", + "color_to": "color_336", + "scale_from": "medium", + "scale_to": "small", + "objects": [ + { + "symbol": "cross", + "center": [ + 180, + 341 + ], + "color": [ + 9, + 191, + 9 + ], + "scale": 1.0 + }, + { + "symbol": "cross", + "center": [ + 518, + 341 + ], + "color": [ + 45, + 45, + 229 + ], + "scale": 1.0 + }, + { + "symbol": "cross", + "center": [ + 856, + 341 + ], + "color": [ + 45, + 45, + 229 + ], + "scale": 0.7 + }, + { + "symbol": "heart", + "center": [ + 180, + 682 + ], + "color": [ + 9, + 191, + 9 + ], + "scale": 1.0 + }, + { + "symbol": "heart", + "center": [ + 518, + 682 + ], + "color": [ + 45, + 45, + 229 + ], + "scale": 1.0 + }, + { + "symbol": "heart", + "center": [ + 856, + 682 + ], + "color": [ + 45, + 45, + 229 + ], + "scale": 0.7 + } + ] + }, + "param_hash": "6df9f8ce5186cc17", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/prompt.txt b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..49af84172d90e8690fdbe3328b6857a035fd565d --- /dev/null +++ b/VBVR-Dataset/shape_color_then_scale_task/shape_color_then_scale_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A→B→C :: D→?→? with two rows of shapes. Top row: color_194 cross at medium becomes color_336 cross at medium, then color_336 cross at small. This shows two rules: first change color from color_194 to color_336, then change size from medium to small. Bottom row: heart starts with color_194 and medium. Apply the same transformation: first change color to color_336, then change size to small. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/final_frame.png b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b4fab9a061b70b71cbd25cad3c8fda2a26fd7213 Binary files /dev/null and b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/final_frame.png differ diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/first_frame.png b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3932257e2ee1f4a15d602aff4d5b871906d5f065 Binary files /dev/null and b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/first_frame.png differ diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/ground_truth.mp4 b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5aafcc26eb1ddbf007e213eda8d303e3ce8bc64b --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d02473a9e7d0fbdd3dc89d6ef8bcb02dcc0f8c70d2a38568b476cf376fe469b +size 129831 diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/metadata.json b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5f795831f8549b893cf5fd13750a07544acb130e --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "shape_outline_fill_00000000", + "generator": "shape_outline_fill", + "timestamp": "2026-02-17T07:36:26.753349", + "parameters": { + "transformation_type": "fill_to_thick", + "style_from": "filled", + 
"style_to": "thick_outline", + "objects": [ + { + "symbol": "rectangle", + "center": [ + 160, + 256 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "filled" + }, + { + "symbol": "rectangle", + "center": [ + 864, + 256 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "thick_outline" + }, + { + "symbol": "minus", + "center": [ + 160, + 768 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "filled" + }, + { + "symbol": "minus", + "center": [ + 864, + 768 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "thick_outline" + } + ] + }, + "param_hash": "46ffe21b2dc62dcc", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/prompt.txt b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..399d5fcaf6e5b85bade6024b786c123065cea5f3 --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000000/prompt.txt @@ -0,0 +1 @@ +Complete the A:B :: C:? shape-style analogy. Show how the right shape in the second row changes its fill or outline so that it follows the same style transformation used between the first two shapes. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/final_frame.png b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..78d598248776088907b4c41547ac7813dbc7ad7a Binary files /dev/null and b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/final_frame.png differ diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/first_frame.png b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9ce8485c10ecaed1623a27c5d66e6831f4ad2346 Binary files /dev/null and b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/first_frame.png differ diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/ground_truth.mp4 b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..68506a2ac6e0af4f60ae0d12add5a4e3ff611b47 --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a848826f5b94499c1f7d303d5db99529cfd0f2a0a78e3a98052af7561ea81f3 +size 147264 diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/metadata.json b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0ca935ef227979bdd4b7ee432097bd8d6d6ff663 --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "shape_outline_fill_00000001", + "generator": "shape_outline_fill", + "timestamp": "2026-02-17T07:36:27.403099", + "parameters": { + "transformation_type": "thick_to_fill", + "style_from": "thick_outline", + 
"style_to": "filled", + "objects": [ + { + "symbol": "minus", + "center": [ + 160, + 256 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "thick_outline" + }, + { + "symbol": "minus", + "center": [ + 864, + 256 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "filled" + }, + { + "symbol": "cross", + "center": [ + 160, + 768 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "thick_outline" + }, + { + "symbol": "cross", + "center": [ + 864, + 768 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "filled" + } + ] + }, + "param_hash": "a23c8498a9371031", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/prompt.txt b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..32e478d2bbb9a1b977f080ea1061708f7f49a3eb --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000001/prompt.txt @@ -0,0 +1 @@ +Follow the visual pattern A:B :: C:? where the first row shows a style change between two identical shapes. Animate the second-row right shape so that its fill or outline style matches the same transformation. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/final_frame.png b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dd13717f8153f3f42e0cb8d90913f04e148c7c85 Binary files /dev/null and b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/final_frame.png differ diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/first_frame.png b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dadd8a9de44c4f3edc3bc6ebbd8e179a33705bd9 Binary files /dev/null and b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/first_frame.png differ diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/ground_truth.mp4 b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..829b881fe1b372a1f0bf15ef41f286f6039a5608 --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82ce5f65436667eef9d7f7d00d4c208ecee1d52e128da4eb53274787b54f4e68 +size 169192 diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/metadata.json b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7bedba3f60b0e57d09ced65a53059ea824965834 --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "shape_outline_fill_00000002", + "generator": "shape_outline_fill", + "timestamp": "2026-02-17T07:36:28.069369", + "parameters": { + "transformation_type": "fill_to_thin", + "style_from": "filled", + 
"style_to": "thin_outline", + "objects": [ + { + "symbol": "hexagon", + "center": [ + 160, + 256 + ], + "color": [ + 9, + 39, + 191 + ], + "style": "filled" + }, + { + "symbol": "hexagon", + "center": [ + 864, + 256 + ], + "color": [ + 9, + 39, + 191 + ], + "style": "thin_outline" + }, + { + "symbol": "trapezoid", + "center": [ + 160, + 768 + ], + "color": [ + 9, + 39, + 191 + ], + "style": "filled" + }, + { + "symbol": "trapezoid", + "center": [ + 864, + 768 + ], + "color": [ + 9, + 39, + 191 + ], + "style": "thin_outline" + } + ] + }, + "param_hash": "36dbff2fe4d30439", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/prompt.txt b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..6822547abcbfdb04e388e37405f97f55696f7b35 --- /dev/null +++ b/VBVR-Dataset/shape_outline_fill_task/shape_outline_fill_00000002/prompt.txt @@ -0,0 +1 @@ +In this A:B :: C:? analogy, apply the same style change to the second-row shape as in the first row. The video should clearly show the filled or outlined style of the right shape in the second row matching the pattern. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/final_frame.png b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..15c356b498568ee630c1788ceb60a97261d0b2b0 Binary files /dev/null and b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/final_frame.png differ diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/first_frame.png b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..550f22515f36afc1b2cb72cb91a7d911bc3ed51f Binary files /dev/null and b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/first_frame.png differ diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/ground_truth.mp4 b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a1c98be6f6eedf7e9bd00155d6c7934fdd2e36e7 --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abcff501ed3fa015ee24f70761913738c906fdd162d16f595760ce015743a6e0 +size 189875 diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/metadata.json b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3c2027bc74f7e2f906cf9569985483ec12f73b90 --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/metadata.json @@ -0,0 +1,108 @@ +{ + "task_id": "shape_outline_then_move_00000000", + "generator": "shape_outline_then_move", + 
"timestamp": "2026-02-17T07:38:18.139210", + "parameters": { + "transformation_type": "outline_then_move", + "style_from": "filled", + "style_to": "thick_outline", + "move_from": "down_tiny", + "move_to": "up_tiny", + "objects": [ + { + "symbol": "rectangle", + "center": [ + 188.0, + 341 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "filled", + "movement": "center" + }, + { + "symbol": "rectangle", + "center": [ + 476.0, + 341 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "thick_outline", + "movement": "center" + }, + { + "symbol": "rectangle", + "center": [ + 764.0, + 316 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "thick_outline", + "movement": "up_tiny" + }, + { + "symbol": "minus", + "center": [ + 188.0, + 682 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "filled", + "movement": "center" + }, + { + "symbol": "minus", + "center": [ + 476.0, + 682 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "thick_outline", + "movement": "center" + }, + { + "symbol": "minus", + "center": [ + 764.0, + 657 + ], + "color": [ + 70, + 130, + 180 + ], + "style": "thick_outline", + "movement": "up_tiny" + } + ] + }, + "param_hash": "e3ccbac7701717cf", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/prompt.txt b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d9d7ae5c50c43ede4c092a7d89e5c1bea31027a1 --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A→B→C :: D→?→? with two rows of shapes and arrows. On the top row, a filled rectangle first becomes an outline-only rectangle (step 1), then moves up by a tiny amount (step 2). 
On the bottom row, the minus starts filled. Apply the same two-step transformation: first convert it to outline-only style, then move it up by a tiny amount, keeping its shape and size the same while only the style and position change. \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/final_frame.png b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..665760c5847109c9b09277dfbb06354546778746 Binary files /dev/null and b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/final_frame.png differ diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/first_frame.png b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4a41943ceff0d8bba26795a2b397a27317deb533 Binary files /dev/null and b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/first_frame.png differ diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/ground_truth.mp4 b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cf73550e297956d26c71abd2a4b5a175126c876c --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3427ba31452580d76ee56f2454105ad47656862f046c2d3f37888ed88466ea8 +size 193144 diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/metadata.json b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..ecb96f3b02ddd74f4dc125720426d0521c2286cb --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/metadata.json @@ -0,0 +1,108 @@ +{ + "task_id": "shape_outline_then_move_00000001", + "generator": "shape_outline_then_move", + "timestamp": "2026-02-17T07:38:18.858893", + "parameters": { + "transformation_type": "outline_then_move", + "style_from": "outline", + "style_to": "thin_outline", + "move_from": "up_tiny", + "move_to": "up", + "objects": [ + { + "symbol": "minus", + "center": [ + 188.0, + 341 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "outline", + "movement": "center" + }, + { + "symbol": "minus", + "center": [ + 476.0, + 341 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "thin_outline", + "movement": "center" + }, + { + "symbol": "minus", + "center": [ + 764.0, + 281 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "thin_outline", + "movement": "up" + }, + { + "symbol": "cross", + "center": [ + 188.0, + 682 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "outline", + "movement": "center" + }, + { + "symbol": "cross", + "center": [ + 476.0, + 682 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "thin_outline", + "movement": "center" + }, + { + "symbol": "cross", + "center": [ + 764.0, + 622 + ], + "color": [ + 38, + 191, + 114 + ], + "style": "thin_outline", + "movement": "up" + } + ] + }, + "param_hash": "5fb9bad5cc3faf4d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/prompt.txt b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..5008f632832672c0fab94350bb0eb2af006f86ba --- /dev/null +++ 
b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A→B→C :: D→?→? with two rows of shapes and arrows. On the top row, a filled minus first becomes an outline-only minus (step 1), then moves up (step 2). On the bottom row, the cross starts filled. Apply the same two-step transformation: first convert it to outline-only style, then move it up, keeping its shape and size the same while only the style and position change. \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/final_frame.png b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7693f3d34b14a389a999d1c535370d105171d1e2 Binary files /dev/null and b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/final_frame.png differ diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/first_frame.png b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f400de00f586dd5ff6b7bf8257b093ae4c4bdfe5 Binary files /dev/null and b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/first_frame.png differ diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/ground_truth.mp4 b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..40b4ec31bf933f9720a47bc1a75e88c2eba130bc --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c95d023afa21f0c2dfcb386e0c97793c82ced5beeb85e3f8b9a56b034252ac9 +size 253380 diff --git 
a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/metadata.json b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d3ebe022c64ac846a7b0ad732bb0d4d2f95b30bd --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/metadata.json @@ -0,0 +1,108 @@ +{ + "task_id": "shape_outline_then_move_00000002", + "generator": "shape_outline_then_move", + "timestamp": "2026-02-17T07:38:19.606994", + "parameters": { + "transformation_type": "outline_then_move", + "style_from": "thick_outline", + "style_to": "outline", + "move_from": "up_small", + "move_to": "up_tiny", + "objects": [ + { + "symbol": "arrow", + "center": [ + 188.0, + 341 + ], + "color": [ + 191, + 87, + 66 + ], + "style": "thick_outline", + "movement": "center" + }, + { + "symbol": "arrow", + "center": [ + 476.0, + 341 + ], + "color": [ + 191, + 87, + 66 + ], + "style": "outline", + "movement": "center" + }, + { + "symbol": "arrow", + "center": [ + 764.0, + 316 + ], + "color": [ + 191, + 87, + 66 + ], + "style": "outline", + "movement": "up_tiny" + }, + { + "symbol": "hexagon", + "center": [ + 188.0, + 682 + ], + "color": [ + 191, + 87, + 66 + ], + "style": "thick_outline", + "movement": "center" + }, + { + "symbol": "hexagon", + "center": [ + 476.0, + 682 + ], + "color": [ + 191, + 87, + 66 + ], + "style": "outline", + "movement": "center" + }, + { + "symbol": "hexagon", + "center": [ + 764.0, + 657 + ], + "color": [ + 191, + 87, + 66 + ], + "style": "outline", + "movement": "up_tiny" + } + ] + }, + "param_hash": "2eb1695421e53cbd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/prompt.txt 
b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..425e80c742c2cc02b1b87ddfe13cbf2dec6a3181 --- /dev/null +++ b/VBVR-Dataset/shape_outline_then_move_task/shape_outline_then_move_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows an analogy A→B→C :: D→?→? with two rows of shapes and arrows. On the top row, a filled arrow first becomes an outline-only arrow (step 1), then moves up by a tiny amount (step 2). On the bottom row, the hexagon starts filled. Apply the same two-step transformation: first convert it to outline-only style, then move it up by a tiny amount, keeping its shape and size the same while only the style and position change. \ No newline at end of file diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/final_frame.png b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6761ae5c1f98e4a90717924f711667c38a01506d Binary files /dev/null and b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/final_frame.png differ diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/first_frame.png b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b1bff0725469d5d1950fad813fe383ae6fc8b48e Binary files /dev/null and b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/first_frame.png differ diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/ground_truth.mp4 b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..ba9d1536c5e08f1afd306d07c17e1287e5ea9318 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:0a9db3304f871d0d332588517981d16942f54c902e2c4edaffaa68887587b46f +size 411131 diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/metadata.json b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fc3a31cba59feda4753a33c88a51f91a294ce588 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/metadata.json @@ -0,0 +1,73 @@ +{ + "task_id": "shape_rotation_00000000", + "generator": "shape_rotation", + "timestamp": "2026-02-17T08:13:02.077182", + "parameters": { + "transformation_type": "rotation", + "rotation_angle": 60, + "objects": [ + { + "symbol": "star", + "center": [ + 240, + 256 + ], + "color": [ + 70, + 130, + 180 + ], + "rotation": 0.0 + }, + { + "symbol": "star", + "center": [ + 784, + 256 + ], + "color": [ + 70, + 130, + 180 + ], + "rotation": 60 + }, + { + "symbol": "parallelogram", + "center": [ + 240, + 768 + ], + "color": [ + 70, + 130, + 180 + ], + "rotation": 0.0 + }, + { + "symbol": "parallelogram", + "center": [ + 784, + 768 + ], + "color": [ + 70, + 130, + 180 + ], + "rotation": 60 + } + ] + }, + "param_hash": "5524a756f943f0c2", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/prompt.txt b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9ea4a90b3eba32634c37be8554bdabe1fe61e14d --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000000/prompt.txt @@ -0,0 +1 @@ +The image shows a visual analogy A:B :: C:? using simple shapes. A and C are the original shapes, B shows shape A after a rotation, and ? is the unknown result. Each shape has a small black marker dot to indicate its orientation. 
Your task is to infer the single rotation that maps A (star) to B, then apply the same rotation to C (parallelogram) around its geometric center. The answer at ? must be shape C rotated by this angle, with size and position unchanged, so that the rotational relationship between A and B is mirrored between C and ?. \ No newline at end of file diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/final_frame.png b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..88ac50e4874965169464e4f1c0dc938ccbabbfb2 Binary files /dev/null and b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/final_frame.png differ diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/first_frame.png b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..19550584dc253eb5f92c896e0b0a57ca5d88becc Binary files /dev/null and b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/first_frame.png differ diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/ground_truth.mp4 b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..efd9c2725fa38801106379002da55137ec769a70 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5adda8834279bffa72e48d4fdac25974f9e3edd19c0283206ee41929ac115d2a +size 408720 diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/metadata.json b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..3aaf78811893a03ef281d88bc951499923d5855a --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/metadata.json @@ -0,0 +1,73 @@ +{ 
+ "task_id": "shape_rotation_00000001", + "generator": "shape_rotation", + "timestamp": "2026-02-17T08:13:02.936941", + "parameters": { + "transformation_type": "rotation", + "rotation_angle": 157.5, + "objects": [ + { + "symbol": "parallelogram", + "center": [ + 240, + 256 + ], + "color": [ + 38, + 191, + 114 + ], + "rotation": 0.0 + }, + { + "symbol": "parallelogram", + "center": [ + 784, + 256 + ], + "color": [ + 38, + 191, + 114 + ], + "rotation": 157.5 + }, + { + "symbol": "octagon", + "center": [ + 240, + 768 + ], + "color": [ + 38, + 191, + 114 + ], + "rotation": 0.0 + }, + { + "symbol": "octagon", + "center": [ + 784, + 768 + ], + "color": [ + 38, + 191, + 114 + ], + "rotation": 157.5 + } + ] + }, + "param_hash": "07253a574e4e631e", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/prompt.txt b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7e2f975f50bd672f181a0b83f4028a3446c86c5 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000001/prompt.txt @@ -0,0 +1 @@ +The image shows a visual analogy A:B :: C:? using simple shapes. A and C are the original shapes, B shows shape A after a rotation, and ? is the unknown result. Each shape has a small black marker dot to indicate its orientation. Your task is to infer the single rotation that maps A (parallelogram) to B, then apply the same rotation to C (octagon) around its geometric center. The answer at ? must be shape C rotated by this angle, with size and position unchanged, so that the rotational relationship between A and B is mirrored between C and ?. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/final_frame.png b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c8e1e7c65e3ba32b228a5fe1ff172b505d6fb7e9 Binary files /dev/null and b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/final_frame.png differ diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/first_frame.png b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2e3e9d410d87c238624ef1af17d1e19c0b450058 Binary files /dev/null and b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/first_frame.png differ diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/ground_truth.mp4 b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4484e493818ca2e2dae7f4337363c35abcea1478 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba188a412833ddebf654f6a9f8e4ec75a8d6c0068fb55b4d08ade993c2303874 +size 482213 diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/metadata.json b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1e76d07a95619f1bbbe543679dc90279d7945259 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/metadata.json @@ -0,0 +1,73 @@ +{ + "task_id": "shape_rotation_00000002", + "generator": "shape_rotation", + "timestamp": "2026-02-17T08:13:03.797674", + "parameters": { + "transformation_type": "rotation", + "rotation_angle": 202.5, + "objects": [ + { + "symbol": "trapezoid", + "center": [ + 240, + 256 + ], + "color": [ + 191, + 87, + 66 + ], + 
"rotation": 0.0 + }, + { + "symbol": "trapezoid", + "center": [ + 784, + 256 + ], + "color": [ + 191, + 87, + 66 + ], + "rotation": 202.5 + }, + { + "symbol": "rectangle", + "center": [ + 240, + 768 + ], + "color": [ + 191, + 87, + 66 + ], + "rotation": 0.0 + }, + { + "symbol": "rectangle", + "center": [ + 784, + 768 + ], + "color": [ + 191, + 87, + 66 + ], + "rotation": 202.5 + } + ] + }, + "param_hash": "0f54ffb73a6b9f9d", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/prompt.txt b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cb7feb115f5716b30c957e59682febecb2e93f85 --- /dev/null +++ b/VBVR-Dataset/shape_rotation_task/shape_rotation_00000002/prompt.txt @@ -0,0 +1 @@ +The image shows a visual analogy A:B :: C:? using simple shapes. A and C are the original shapes, B shows shape A after a rotation, and ? is the unknown result. Each shape has a small black marker dot to indicate its orientation. Your task is to infer the single rotation that maps A (trapezoid) to B, then apply the same rotation to C (rectangle) around its geometric center. The answer at ? must be shape C rotated by this angle, with size and position unchanged, so that the rotational relationship between A and B is mirrored between C and ?. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/final_frame.png b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..584eaa66fe3153e0370226580cc49d387ef3d3e4 Binary files /dev/null and b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/final_frame.png differ diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/first_frame.png b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..bcd7bfc5ec0a2a036669d5c23c9ce694e0772379 Binary files /dev/null and b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/first_frame.png differ diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/ground_truth.mp4 b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0791463b8daf5b4714ff9f0f928c540a5dca97b5 --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f29f9afa7dd6bff65c911c9d35cb4b5bd46f3963ed4c46abf641a04a95271a82 +size 229007 diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/metadata.json b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..273fe03e135aa1b5f657a9d1b81aa246f6f316b9 --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/metadata.json @@ -0,0 +1,92 @@ +{ + "task_id": "shape_scale_then_outline_00000000", + "generator": 
"shape_scale_then_outline", + "timestamp": "2026-02-17T07:38:30.777014", + "parameters": { + "transformation_type": "scale_then_outline", + "shape_a": "rectangle", + "shape_b": "rectangle", + "shape_c": "rectangle", + "shape_d": "minus", + "shape_e": "minus", + "shape_f": "minus", + "scale_from": "tiny", + "scale_to": "huge", + "style_from": "filled", + "style_to": "thick_outline", + "color": [ + 70, + 130, + 180 + ], + "description": "Step 1: tiny → huge, Step 2: filled → thick_outline", + "signature": [ + [ + "color", + [ + 70, + 130, + 180 + ] + ], + [ + "description", + "Step 1: tiny → huge, Step 2: filled → thick_outline" + ], + [ + "scale_from", + "tiny" + ], + [ + "scale_to", + "huge" + ], + [ + "shape_a", + "rectangle" + ], + [ + "shape_b", + "rectangle" + ], + [ + "shape_c", + "rectangle" + ], + [ + "shape_d", + "minus" + ], + [ + "shape_e", + "minus" + ], + [ + "shape_f", + "minus" + ], + [ + "style_from", + "filled" + ], + [ + "style_to", + "thick_outline" + ], + [ + "transformation_type", + "scale_then_outline" + ] + ] + }, + "param_hash": "65b4560b49213327", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/prompt.txt b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ca84e97d8372d29074fca3c92de1614acb18b43d --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000000/prompt.txt @@ -0,0 +1 @@ +Animate the two-step transformation: scale change followed by fill-to-outline conversion. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/final_frame.png b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7291774f01e48b879492afeb9f4719644f97dc90 Binary files /dev/null and b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/final_frame.png differ diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/first_frame.png b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c30588dfa63cb701e63f91e637b0d757c8f8ab12 Binary files /dev/null and b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/first_frame.png differ diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/ground_truth.mp4 b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e6670bc08e0e001229108ce48aefa8062fe8168e --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9036cd2cbaeb6642ed859c259c423ea810b16726b13174fb4386d7683fe32d2 +size 222344 diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/metadata.json b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4d4b9270fbd304490f8dda170dd3bfe0b48d1a36 --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/metadata.json @@ -0,0 +1,92 @@ +{ + "task_id": "shape_scale_then_outline_00000001", + "generator": 
"shape_scale_then_outline", + "timestamp": "2026-02-17T07:38:31.785823", + "parameters": { + "transformation_type": "scale_then_outline", + "shape_a": "minus", + "shape_b": "minus", + "shape_c": "minus", + "shape_d": "cross", + "shape_e": "cross", + "shape_f": "cross", + "scale_from": "medium", + "scale_to": "large", + "style_from": "thin_outline", + "style_to": "thick_outline", + "color": [ + 38, + 191, + 114 + ], + "description": "Step 1: medium → large, Step 2: thin_outline → thick_outline", + "signature": [ + [ + "color", + [ + 38, + 191, + 114 + ] + ], + [ + "description", + "Step 1: medium → large, Step 2: thin_outline → thick_outline" + ], + [ + "scale_from", + "medium" + ], + [ + "scale_to", + "large" + ], + [ + "shape_a", + "minus" + ], + [ + "shape_b", + "minus" + ], + [ + "shape_c", + "minus" + ], + [ + "shape_d", + "cross" + ], + [ + "shape_e", + "cross" + ], + [ + "shape_f", + "cross" + ], + [ + "style_from", + "thin_outline" + ], + [ + "style_to", + "thick_outline" + ], + [ + "transformation_type", + "scale_then_outline" + ] + ] + }, + "param_hash": "1572a92e721150b6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/prompt.txt b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..55fbd8ee72444a3912a0d99aef0bb843c555f75b --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000001/prompt.txt @@ -0,0 +1 @@ +Complete the analogy by revealing the shape with the correct scale and outline style. 
\ No newline at end of file diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/final_frame.png b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4cb153c608f6b56d2cd36274b2970123f98f4d53 Binary files /dev/null and b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/final_frame.png differ diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/first_frame.png b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8781f46cdf166389161184eab3f9efdba9a27abd Binary files /dev/null and b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/first_frame.png differ diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/ground_truth.mp4 b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..bb18382d2c4c364c896bdbb435c4be2438acfff5 --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:512a36fbe0703ef879aab05e0aa8e5f632fb328cfae3adf40f5dd204e9fe750e +size 372819 diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/metadata.json b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..87a00a1d551a9c4f15221c0e56a839dff4d8c112 --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/metadata.json @@ -0,0 +1,92 @@ +{ + "task_id": "shape_scale_then_outline_00000002", + "generator": 
"shape_scale_then_outline", + "timestamp": "2026-02-17T07:38:32.848994", + "parameters": { + "transformation_type": "scale_then_outline", + "shape_a": "hexagon", + "shape_b": "hexagon", + "shape_c": "hexagon", + "shape_d": "trapezoid", + "shape_e": "trapezoid", + "shape_f": "trapezoid", + "scale_from": "tiny", + "scale_to": "huge", + "style_from": "thick_outline", + "style_to": "thin_outline", + "color": [ + 9, + 39, + 191 + ], + "description": "Step 1: tiny → huge, Step 2: thick_outline → thin_outline", + "signature": [ + [ + "color", + [ + 9, + 39, + 191 + ] + ], + [ + "description", + "Step 1: tiny → huge, Step 2: thick_outline → thin_outline" + ], + [ + "scale_from", + "tiny" + ], + [ + "scale_to", + "huge" + ], + [ + "shape_a", + "hexagon" + ], + [ + "shape_b", + "hexagon" + ], + [ + "shape_c", + "hexagon" + ], + [ + "shape_d", + "trapezoid" + ], + [ + "shape_e", + "trapezoid" + ], + [ + "shape_f", + "trapezoid" + ], + [ + "style_from", + "thick_outline" + ], + [ + "style_to", + "thin_outline" + ], + [ + "transformation_type", + "scale_then_outline" + ] + ] + }, + "param_hash": "77f22e308cf004df", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/prompt.txt b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cb7b56d97e3d9be387e76c39fad199884ffb955 --- /dev/null +++ b/VBVR-Dataset/shape_scale_then_outline_task/shape_scale_then_outline_00000002/prompt.txt @@ -0,0 +1 @@ +Show the shape first changing size and then becoming outline-only. Both transformations should match the example pattern. 
\ No newline at end of file diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/final_frame.png b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..354c086d8e9e691aaccf9e3bf1249b7d25627223 Binary files /dev/null and b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/final_frame.png differ diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/first_frame.png b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d41178c7c0e6d474adf1f8357f05836dfc6684d2 Binary files /dev/null and b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/first_frame.png differ diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/ground_truth.mp4 b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..2cce1016968827906454744240827f08e9a92306 --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdc22f4e0cc381166b4887ad2a5555b1332fb37d6997d9c92d26ad4222cda78 +size 589545 diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/metadata.json b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..fab6a52e006cccb1db2e62ec52e6ca99e87e2348 --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/metadata.json @@ -0,0 +1,142 @@ +{ + "task_id": "sliding_puzzle_00000000", + "generator": "sliding_puzzle", + "timestamp": "2026-02-27T07:04:14.657564", + "parameters": { + "size": 3, + "min_moves": 3, + "max_moves": 10, + "solution_length": 9, + "tile_color_theme": "purple", + "generation_method": "random", + "objects": [ + { + "symbol": "tile_1", 
+ "value": 1, + "initial_position": [ + 1, + 0 + ], + "target_position": [ + 0, + 0 + ], + "color": "purple" + }, + { + "symbol": "tile_2", + "value": 2, + "initial_position": [ + 0, + 0 + ], + "target_position": [ + 0, + 1 + ], + "color": "purple" + }, + { + "symbol": "tile_3", + "value": 3, + "initial_position": [ + 0, + 1 + ], + "target_position": [ + 0, + 2 + ], + "color": "purple" + }, + { + "symbol": "tile_4", + "value": 4, + "initial_position": [ + 2, + 0 + ], + "target_position": [ + 1, + 0 + ], + "color": "purple" + }, + { + "symbol": "tile_5", + "value": 5, + "initial_position": [ + 0, + 2 + ], + "target_position": [ + 1, + 1 + ], + "color": "purple" + }, + { + "symbol": "tile_6", + "value": 6, + "initial_position": [ + 2, + 2 + ], + "target_position": [ + 1, + 2 + ], + "color": "purple" + }, + { + "symbol": "tile_7", + "value": 7, + "initial_position": [ + 2, + 1 + ], + "target_position": [ + 2, + 0 + ], + "color": "purple" + }, + { + "symbol": "tile_8", + "value": 8, + "initial_position": [ + 1, + 1 + ], + "target_position": [ + 2, + 1 + ], + "color": "purple" + }, + { + "symbol": "blank", + "value": 0, + "initial_position": [ + 1, + 2 + ], + "target_position": [ + 2, + 2 + ], + "color": null + } + ] + }, + "param_hash": "b83a25ce04e6e619", + "generation": { + "seed": 2026, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/prompt.txt b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8005f5d5b37744c9e5faef2a49bb5c5214dfc8fd --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000000/prompt.txt @@ -0,0 +1,7 @@ +Complete this sliding puzzle. The goal is to arrange the numbered tiles in sequential order (filling each row from left to right, with rows from top to bottom), with the blank space at the bottom-right corner. 
+ +Rules: Only tiles adjacent to the blank space can be moved. Slide one tile per move into the blank space. + +Complete in exactly 9 moves. + +Do not make extra moves. Keep the camera view fixed and maintain the grid structure unchanged. \ No newline at end of file diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/final_frame.png b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..344926debdac62809fda2036f48d20e026c3f46c Binary files /dev/null and b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/final_frame.png differ diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/first_frame.png b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7f9b13d32225cf9e1a5f9689f5ee2b20253c4919 Binary files /dev/null and b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/first_frame.png differ diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/ground_truth.mp4 b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..34ddbe319facccf6f837399c4d4076305ec15147 --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e33eb88851b4284b1e00805c451196dee56b833c6dd3796a1206a452d41563 +size 843073 diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/metadata.json b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..bf2bafcab3f5accd0c3c761ff332a68583716e37 --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/metadata.json @@ -0,0 +1,350 @@ +{ + "task_id": "sliding_puzzle_00000001", + "generator": "sliding_puzzle", + 
"timestamp": "2026-02-27T07:04:15.472972", + "parameters": { + "size": 5, + "min_moves": 8, + "max_moves": 15, + "solution_length": 9, + "tile_color_theme": "magenta", + "generation_method": "random", + "objects": [ + { + "symbol": "tile_1", + "value": 1, + "initial_position": [ + 0, + 0 + ], + "target_position": [ + 0, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_2", + "value": 2, + "initial_position": [ + 0, + 1 + ], + "target_position": [ + 0, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_3", + "value": 3, + "initial_position": [ + 0, + 2 + ], + "target_position": [ + 0, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_4", + "value": 4, + "initial_position": [ + 0, + 3 + ], + "target_position": [ + 0, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_5", + "value": 5, + "initial_position": [ + 0, + 4 + ], + "target_position": [ + 0, + 4 + ], + "color": "magenta" + }, + { + "symbol": "tile_6", + "value": 6, + "initial_position": [ + 1, + 0 + ], + "target_position": [ + 1, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_7", + "value": 7, + "initial_position": [ + 1, + 1 + ], + "target_position": [ + 1, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_8", + "value": 8, + "initial_position": [ + 2, + 2 + ], + "target_position": [ + 1, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_9", + "value": 9, + "initial_position": [ + 1, + 2 + ], + "target_position": [ + 1, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_10", + "value": 10, + "initial_position": [ + 1, + 3 + ], + "target_position": [ + 1, + 4 + ], + "color": "magenta" + }, + { + "symbol": "tile_11", + "value": 11, + "initial_position": [ + 2, + 0 + ], + "target_position": [ + 2, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_12", + "value": 12, + "initial_position": [ + 2, + 1 + ], + "target_position": [ + 2, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_13", + "value": 13, + "initial_position": [ + 2, + 3 + ], + 
"target_position": [ + 2, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_14", + "value": 14, + "initial_position": [ + 3, + 3 + ], + "target_position": [ + 2, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_15", + "value": 15, + "initial_position": [ + 1, + 4 + ], + "target_position": [ + 2, + 4 + ], + "color": "magenta" + }, + { + "symbol": "tile_16", + "value": 16, + "initial_position": [ + 3, + 0 + ], + "target_position": [ + 3, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_17", + "value": 17, + "initial_position": [ + 3, + 1 + ], + "target_position": [ + 3, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_18", + "value": 18, + "initial_position": [ + 3, + 2 + ], + "target_position": [ + 3, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_19", + "value": 19, + "initial_position": [ + 2, + 4 + ], + "target_position": [ + 3, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_20", + "value": 20, + "initial_position": [ + 4, + 4 + ], + "target_position": [ + 3, + 4 + ], + "color": "magenta" + }, + { + "symbol": "tile_21", + "value": 21, + "initial_position": [ + 4, + 0 + ], + "target_position": [ + 4, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_22", + "value": 22, + "initial_position": [ + 4, + 1 + ], + "target_position": [ + 4, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_23", + "value": 23, + "initial_position": [ + 4, + 2 + ], + "target_position": [ + 4, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_24", + "value": 24, + "initial_position": [ + 4, + 3 + ], + "target_position": [ + 4, + 3 + ], + "color": "magenta" + }, + { + "symbol": "blank", + "value": 0, + "initial_position": [ + 3, + 4 + ], + "target_position": [ + 4, + 4 + ], + "color": null + } + ] + }, + "param_hash": "5f07c245d666c3a5", + "generation": { + "seed": 2026, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git 
a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/prompt.txt b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..8005f5d5b37744c9e5faef2a49bb5c5214dfc8fd --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000001/prompt.txt @@ -0,0 +1,7 @@ +Complete this sliding puzzle. The goal is to arrange the numbered tiles in sequential order (filling each row from left to right, with rows from top to bottom), with the blank space at the bottom-right corner. + +Rules: Only tiles adjacent to the blank space can be moved. Slide one tile per move into the blank space. + +Complete in exactly 9 moves. + +Do not make extra moves. Keep the camera view fixed and maintain the grid structure unchanged. \ No newline at end of file diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/final_frame.png b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..49f9b072e404e1312c7fd67b090e4f7b1b716422 Binary files /dev/null and b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/final_frame.png differ diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/first_frame.png b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4a5a3c3d374a40441d81a2ef4c5d7f63a684fed4 Binary files /dev/null and b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/first_frame.png differ diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/ground_truth.mp4 b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..dd5eeb6c39113629581d8ce5c698f2251a7c28e1 --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:f48cde79fd354f72ff41db2f8bf0d0e41cd99d2e21689546e790fc8f3bd89aa9 +size 472658 diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/metadata.json b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..253b30a297dcfeffe8fbc7df363f3c2b4f64b09b --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/metadata.json @@ -0,0 +1,233 @@ +{ + "task_id": "sliding_puzzle_00000002", + "generator": "sliding_puzzle", + "timestamp": "2026-02-27T07:04:16.046275", + "parameters": { + "size": 4, + "min_moves": 5, + "max_moves": 12, + "solution_length": 6, + "tile_color_theme": "magenta", + "generation_method": "random", + "objects": [ + { + "symbol": "tile_1", + "value": 1, + "initial_position": [ + 0, + 0 + ], + "target_position": [ + 0, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_2", + "value": 2, + "initial_position": [ + 0, + 1 + ], + "target_position": [ + 0, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_3", + "value": 3, + "initial_position": [ + 0, + 2 + ], + "target_position": [ + 0, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_4", + "value": 4, + "initial_position": [ + 0, + 3 + ], + "target_position": [ + 0, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_5", + "value": 5, + "initial_position": [ + 1, + 0 + ], + "target_position": [ + 1, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_6", + "value": 6, + "initial_position": [ + 2, + 1 + ], + "target_position": [ + 1, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_7", + "value": 7, + "initial_position": [ + 1, + 1 + ], + "target_position": [ + 1, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_8", + "value": 8, + "initial_position": [ + 1, + 2 + ], + "target_position": [ + 1, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_9", + "value": 9, + "initial_position": [ + 2, + 0 + 
], + "target_position": [ + 2, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_10", + "value": 10, + "initial_position": [ + 2, + 2 + ], + "target_position": [ + 2, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_11", + "value": 11, + "initial_position": [ + 3, + 2 + ], + "target_position": [ + 2, + 2 + ], + "color": "magenta" + }, + { + "symbol": "tile_12", + "value": 12, + "initial_position": [ + 2, + 3 + ], + "target_position": [ + 2, + 3 + ], + "color": "magenta" + }, + { + "symbol": "tile_13", + "value": 13, + "initial_position": [ + 3, + 0 + ], + "target_position": [ + 3, + 0 + ], + "color": "magenta" + }, + { + "symbol": "tile_14", + "value": 14, + "initial_position": [ + 3, + 1 + ], + "target_position": [ + 3, + 1 + ], + "color": "magenta" + }, + { + "symbol": "tile_15", + "value": 15, + "initial_position": [ + 3, + 3 + ], + "target_position": [ + 3, + 2 + ], + "color": "magenta" + }, + { + "symbol": "blank", + "value": 0, + "initial_position": [ + 1, + 3 + ], + "target_position": [ + 3, + 3 + ], + "color": null + } + ] + }, + "param_hash": "19fe4f0af43370b3", + "generation": { + "seed": 2026, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/prompt.txt b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..73ab756ff1cddde9369be6bf6b7a061a9afd25fe --- /dev/null +++ b/VBVR-Dataset/sliding_puzzle_task/sliding_puzzle_00000002/prompt.txt @@ -0,0 +1,7 @@ +Complete this sliding puzzle. The goal is to arrange the numbered tiles in sequential order (filling each row from left to right, with rows from top to bottom), with the blank space at the bottom-right corner. + +Rules: Only tiles adjacent to the blank space can be moved. Slide one tile per move into the blank space. + +Complete in exactly 6 moves. + +Do not make extra moves. 
Keep the camera view fixed and maintain the grid structure unchanged. \ No newline at end of file diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/final_frame.png b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a11522d965283075e2f567762a371cead2c20af1 Binary files /dev/null and b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/final_frame.png differ diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/first_frame.png b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4a9f6ae519eaa8a7621d4340887a5fb40c876bae Binary files /dev/null and b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/first_frame.png differ diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/ground_truth.mp4 b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cefc74be670cb24319f81d19985aa3ecf5241ebf --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f51cba7170a20dbe64d20e8edd3aa2d526f090dc650b565ab325387881e4e00 +size 208169 diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/metadata.json b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..634529270f58a73c55162d6d7dfd308ca89a0d31 --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "sort_objects_by_rule_00000000", + "generator": "sort_objects_by_rule", + "timestamp": 
"2026-02-17T07:07:21.388047", + "parameters": { + "objects": [ + { + "id": 1, + "shape": "star", + "color": "purple", + "size": 0.21323, + "initial_position": [ + 0.240198, + 0.818868 + ], + "target_position": [ + 0.5, + 0.176615 + ] + }, + { + "id": 2, + "shape": "star", + "color": "gray", + "size": 0.067656, + "initial_position": [ + 0.621059, + 0.358481 + ], + "target_position": [ + 0.5, + 0.896172 + ] + } + ], + "arrange": "top-down", + "sort": "big-small" + }, + "param_hash": "4b81cc5c1dec9390", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/prompt.txt b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..efcb4b4895eb40ed80c7a8a258370034820ee062 --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 2 star objects of different sizes. Arrange the objects in a vertical column from top to bottom, largest to smallest. 
\ No newline at end of file diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/final_frame.png b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..582a950f840488ebe456da5db1cc2dc1429829f1 Binary files /dev/null and b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/final_frame.png differ diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/first_frame.png b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2ba8a6c03e9803801a0cd3d7acbffa59245226d6 Binary files /dev/null and b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/first_frame.png differ diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/ground_truth.mp4 b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..ab9e36a6256a9eb54ab2d213bb24e9138fa8887b --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd73fea964b9cf26017d0a4bb19dfa3a0ac33c3979664a702221f47a925b8d9e +size 240294 diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/metadata.json b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..2b59cab4114e9741c417019820fddca7d5f204e9 --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/metadata.json @@ -0,0 +1,49 @@ +{ + "task_id": "sort_objects_by_rule_00000001", + "generator": "sort_objects_by_rule", + "timestamp": "2026-02-17T07:07:22.084441", + "parameters": { + "objects": [ + { + 
"id": 1, + "shape": "circle", + "color": "magenta", + "size": 0.069261, + "initial_position": [ + 0.124128, + 0.530336 + ], + "target_position": [ + 0.104631, + 0.5 + ] + }, + { + "id": 2, + "shape": "circle", + "color": "lime", + "size": 0.211555, + "initial_position": [ + 0.433205, + 0.473342 + ], + "target_position": [ + 0.824223, + 0.5 + ] + } + ], + "arrange": "left-right", + "sort": "small-big" + }, + "param_hash": "15b45f8caf4e1da0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/prompt.txt b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..022edd8b17754f0a05ae66bd99bd6f0aa4ddcb8b --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 2 circle objects of different sizes. Arrange the objects in a vertical column from top to bottom, smallest to largest. 
\ No newline at end of file diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/final_frame.png b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a2d4a76be579001f214292caf2e1f1130d57c71f Binary files /dev/null and b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/final_frame.png differ diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/first_frame.png b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..dfe41aeef09b6bf20016abb1b71d7305014a1e7b Binary files /dev/null and b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/first_frame.png differ diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/ground_truth.mp4 b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..205027aee1726d6a813e7743cf9b7e7b2056ed5f --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8b7dd4e6bf4c6c33b21ce2ce96f0ed783a486f83225f63cf1e187078eaa5d4 +size 336905 diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/metadata.json b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7e3519dcdc6a8758254f82eb3a5df295b5a3f0ec --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/metadata.json @@ -0,0 +1,77 @@ +{ + "task_id": "sort_objects_by_rule_00000002", + "generator": "sort_objects_by_rule", + "timestamp": "2026-02-17T07:07:22.800491", + "parameters": { + "objects": [ + { + 
"id": 1, + "shape": "triangle", + "color": "pink", + "size": 0.227894, + "initial_position": [ + 0.274397, + 0.287661 + ], + "target_position": [ + 0.183947, + 0.5 + ] + }, + { + "id": 2, + "shape": "triangle", + "color": "yellow", + "size": 0.16845, + "initial_position": [ + 0.693297, + 0.781185 + ], + "target_position": [ + 0.470532, + 0.5 + ] + }, + { + "id": 3, + "shape": "triangle", + "color": "navy", + "size": 0.109403, + "initial_position": [ + 0.646143, + 0.562121 + ], + "target_position": [ + 0.697871, + 0.5 + ] + }, + { + "id": 4, + "shape": "triangle", + "color": "lime", + "size": 0.089014, + "initial_position": [ + 0.847761, + 0.39312 + ], + "target_position": [ + 0.885493, + 0.5 + ] + } + ], + "arrange": "left-right", + "sort": "big-small" + }, + "param_hash": "df5ffdb3fb5b5a46", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/prompt.txt b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..89e376822f0aed449346dceb6f3858d736805476 --- /dev/null +++ b/VBVR-Dataset/sort_objects_by_rule_task/sort_objects_by_rule_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 triangle objects of different sizes. Arrange the objects in a vertical column from top to bottom, largest to smallest. 
\ No newline at end of file diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/final_frame.png b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3e520f098b594e0711fc1c931a1df1aabda9e2e5 Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/final_frame.png differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/first_frame.png b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b8a1a45be17eaa49ee102d5a7984cc8b1396aeee Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/first_frame.png differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/ground_truth.mp4 b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..aa4cf91067398af46fb61d1511cb097243ef41c4 Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/metadata.json b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..06d9ce619fe1463996e00b74200627e5edda40e5 --- /dev/null +++ b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/metadata.json @@ -0,0 +1,73 @@ +{ + "task_id": "spot_unique_non_repeated_color_00000000", + 
"generator": "spot_unique_non_repeated_color", + "timestamp": "2026-02-17T06:52:05.633627", + "parameters": { + "shapes": [ + { + "type": "circle", + "color": [ + 161, + 22, + 229 + ], + "center": [ + 761.311465, + 512.591377 + ] + }, + { + "type": "rectangle", + "color": [ + 229, + 142, + 22 + ], + "center": [ + 846.563436, + 122.309768 + ] + }, + { + "type": "polygon", + "color": [ + 229, + 142, + 22 + ], + "center": [ + 137.295235, + 542.241454 + ] + }, + { + "type": "triangle", + "color": [ + 229, + 142, + 22 + ], + "center": [ + 479.140356, + 696.306915 + ] + } + ], + "unique_shape_index": 0, + "unique_color": [ + 161, + 22, + 229 + ] + }, + "param_hash": "fbceced820766177", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/prompt.txt b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..89cefe9ea72fbdc7d912212856379bb02c1b4fd6 --- /dev/null +++ b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 4 geometric shapes with different colors. Exactly one color appears only once, while every other color appears at least twice. First find the shape whose color is unique, then outline that entire shape with a black contour. Do not add any extra marks. Show the complete marking process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/final_frame.png b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7559c608746d25cb566eb77d4f637c289db87c0b Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/final_frame.png differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/first_frame.png b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..80d040a58c4b9859910f3c199edbf22bad09774f Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/first_frame.png differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/ground_truth.mp4 b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..41561ed693fcea4a58af633fba3f94ce31d41fdf Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/metadata.json b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..45e09aa3eee0d0b75fd1e42bd206784fec254fb1 --- /dev/null +++ b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/metadata.json @@ -0,0 +1,61 @@ +{ + "task_id": "spot_unique_non_repeated_color_00000001", + 
"generator": "spot_unique_non_repeated_color", + "timestamp": "2026-02-17T06:52:06.000915", + "parameters": { + "shapes": [ + { + "type": "triangle", + "color": [ + 22, + 229, + 190 + ], + "center": [ + 696.717971, + 672.024622 + ] + }, + { + "type": "polygon", + "color": [ + 22, + 70, + 229 + ], + "center": [ + 382.802669, + 805.901448 + ] + }, + { + "type": "circle", + "color": [ + 22, + 229, + 190 + ], + "center": [ + 861.65158, + 133.880574 + ] + } + ], + "unique_shape_index": 1, + "unique_color": [ + 22, + 70, + 229 + ] + }, + "param_hash": "6c2330e11f679720", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/prompt.txt b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0927f7759c71b166f068a425dc35a9e3c2536189 --- /dev/null +++ b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 geometric shapes with different colors. Exactly one color appears only once, while every other color appears at least twice. First find the shape whose color is unique, then outline that entire shape with a black contour. Do not add any extra marks. Show the complete marking process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/final_frame.png b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..cb2333be2be3172caa56e6c9cbc20cfab8bd94c7 Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/final_frame.png differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/first_frame.png b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7be81322ad8bc6ccd3d8ec361126a483d4de825c Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/first_frame.png differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/ground_truth.mp4 b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..321dd0cce02e7ee9a8c75c0edda00930d4544168 Binary files /dev/null and b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/metadata.json b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9389658e82c7ed230810f91f1813d68f7fb25922 --- /dev/null +++ b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/metadata.json @@ -0,0 +1,97 @@ +{ + "task_id": "spot_unique_non_repeated_color_00000002", + 
"generator": "spot_unique_non_repeated_color", + "timestamp": "2026-02-17T06:52:06.335227", + "parameters": { + "shapes": [ + { + "type": "polygon", + "color": [ + 22, + 229, + 33 + ], + "center": [ + 562.902032, + 343.577667 + ] + }, + { + "type": "polygon", + "color": [ + 71, + 22, + 229 + ], + "center": [ + 818.88886, + 219.94958 + ] + }, + { + "type": "rectangle", + "color": [ + 71, + 22, + 229 + ], + "center": [ + 831.492641, + 611.69447 + ] + }, + { + "type": "rectangle", + "color": [ + 22, + 229, + 33 + ], + "center": [ + 531.329767, + 630.471693 + ] + }, + { + "type": "polygon", + "color": [ + 168, + 229, + 22 + ], + "center": [ + 765.754875, + 896.816282 + ] + }, + { + "type": "polygon", + "color": [ + 22, + 229, + 33 + ], + "center": [ + 256.158952, + 275.698997 + ] + } + ], + "unique_shape_index": 4, + "unique_color": [ + 168, + 229, + 22 + ] + }, + "param_hash": "2564374ec1cf47b2", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/prompt.txt b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec40c24d053fb5230557a738f815755cea332b4e --- /dev/null +++ b/VBVR-Dataset/spot_unique_non_repeated_color_task/spot_unique_non_repeated_color_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 6 geometric shapes with different colors. Exactly one color appears only once, while every other color appears at least twice. First find the shape whose color is unique, then outline that entire shape with a black contour. Do not add any extra marks. Show the complete marking process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000000/final_frame.png b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b549c1a21e784f8731e87dbd99b969992e68d6d0 Binary files /dev/null and b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/final_frame.png differ diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000000/first_frame.png b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2d81cb394a87c9581574c5c68702685211e9eaa3 Binary files /dev/null and b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/first_frame.png differ diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000000/ground_truth.mp4 b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6825a5136b5745fd62559c2a38592120124c240d --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b4b0c629f278e209f0604b36e18b4ce32cae020b1cbdcab32623d8755bc6a3e +size 363044 diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000000/metadata.json b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..88af6c9182f2cfa95e87068fef70d5fc1ee96011 --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/metadata.json @@ -0,0 +1,129 @@ +{ + "task_id": "stable_sort_00000000", + "generator": "stable_sort", + "timestamp": "2026-02-17T07:26:08.455446", + "parameters": { + "groups": [ + [ + { + "type": "triangle", + "size": 66, + "color": [ + 230, + 105, + 105 + ], + "initial_position": [ + 213, + 97 + ], + "final_position": [ + 94, + 512 + ] + }, + { + "type": "triangle", + "size": 98, + "color": [ + 230, + 105, + 105 + ], 
+ "initial_position": [ + 672, + 276 + ], + "final_position": [ + 218, + 512 + ] + }, + { + "type": "triangle", + "size": 147, + "color": [ + 230, + 105, + 105 + ], + "initial_position": [ + 631, + 765 + ], + "final_position": [ + 382, + 512 + ] + } + ], + [ + { + "type": "circle", + "size": 73, + "color": [ + 200, + 120, + 220 + ], + "initial_position": [ + 559, + 265 + ], + "final_position": [ + 534, + 512 + ] + }, + { + "type": "circle", + "size": 117, + "color": [ + 200, + 120, + 220 + ], + "initial_position": [ + 684, + 403 + ], + "final_position": [ + 671, + 512 + ] + }, + { + "type": "circle", + "size": 188, + "color": [ + 200, + 120, + 220 + ], + "initial_position": [ + 337, + 471 + ], + "final_position": [ + 866, + 512 + ] + } + ] + ], + "type_order": [ + "triangle", + "circle" + ] + }, + "param_hash": "b9906eaae7f4d54b", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000000/prompt.txt b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf4a029493ecf997b81d163c29a1ecab1adef05b --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000000/prompt.txt @@ -0,0 +1 @@ +The scene contains two types of shapes, each type has three shapes of different sizes arranged randomly. Keep all shapes unchanged in appearance (type, size, and color). Only rearrange their positions: first group the shapes by type, then within each group, sort the shapes from smallest to largest (left to right), and arrange all shapes in a single horizontal line from left to right. 
\ No newline at end of file diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000001/final_frame.png b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..77c061ec8ce8138d2d77224d738ca15eedaf4b40 Binary files /dev/null and b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/final_frame.png differ diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000001/first_frame.png b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..2a4995cbcf90543fa31a436f6fd8cc0955d78683 Binary files /dev/null and b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/first_frame.png differ diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000001/ground_truth.mp4 b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..bb8f437126e94addab8297fa7d81831e5d188cbe --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b36466aff75311f4f96a8a9aac61a6bf84ba99d46b330d33676e04b7b714391 +size 348296 diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000001/metadata.json b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..de998aa353342b77e504d627ba8c71f5f807520b --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/metadata.json @@ -0,0 +1,129 @@ +{ + "task_id": "stable_sort_00000001", + "generator": "stable_sort", + "timestamp": "2026-02-17T07:26:09.527471", + "parameters": { + "groups": [ + [ + { + "type": "square", + "size": 73, + "color": [ + 245, + 180, + 100 + ], + "initial_position": [ + 632, + 385 + ], + "final_position": [ + 97, + 512 + ] + }, + { + "type": "square", + "size": 109, + "color": [ + 245, + 180, + 100 + ], + 
"initial_position": [ + 749, + 173 + ], + "final_position": [ + 234, + 512 + ] + }, + { + "type": "square", + "size": 163, + "color": [ + 245, + 180, + 100 + ], + "initial_position": [ + 788, + 531 + ], + "final_position": [ + 416, + 512 + ] + } + ], + [ + { + "type": "triangle", + "size": 61, + "color": [ + 120, + 220, + 170 + ], + "initial_position": [ + 427, + 466 + ], + "final_position": [ + 574, + 512 + ] + }, + { + "type": "triangle", + "size": 100, + "color": [ + 120, + 220, + 170 + ], + "initial_position": [ + 598, + 627 + ], + "final_position": [ + 701, + 512 + ] + }, + { + "type": "triangle", + "size": 163, + "color": [ + 120, + 220, + 170 + ], + "initial_position": [ + 198, + 528 + ], + "final_position": [ + 878, + 512 + ] + } + ] + ], + "type_order": [ + "square", + "triangle" + ] + }, + "param_hash": "342df2714396d9fd", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000001/prompt.txt b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf4a029493ecf997b81d163c29a1ecab1adef05b --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000001/prompt.txt @@ -0,0 +1 @@ +The scene contains two types of shapes, each type has three shapes of different sizes arranged randomly. Keep all shapes unchanged in appearance (type, size, and color). Only rearrange their positions: first group the shapes by type, then within each group, sort the shapes from smallest to largest (left to right), and arrange all shapes in a single horizontal line from left to right. 
\ No newline at end of file diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000002/final_frame.png b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f2f4d4d86511cafa485d77d8e28d9b1ec814f884 Binary files /dev/null and b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/final_frame.png differ diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000002/first_frame.png b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..069c8d94739e955cea37214c440a211ef3cc0471 Binary files /dev/null and b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/first_frame.png differ diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000002/ground_truth.mp4 b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7af77aefca32ab27dfa65a5d3c17567dea42dd2c --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffc993b7bed79048f9b27b3a1af553d16653358fd657073443e9be3492d9b3f +size 420627 diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000002/metadata.json b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0978f7ab865b44edf8ffa2145a4e48b729ba9cf5 --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/metadata.json @@ -0,0 +1,129 @@ +{ + "task_id": "stable_sort_00000002", + "generator": "stable_sort", + "timestamp": "2026-02-17T07:26:10.614253", + "parameters": { + "groups": [ + [ + { + "type": "triangle", + "size": 92, + "color": [ + 120, + 170, + 255 + ], + "initial_position": [ + 374, + 493 + ], + "final_position": [ + 107, + 512 + ] + }, + { + "type": "triangle", + "size": 143, + "color": [ + 120, + 170, + 255 + 
], + "initial_position": [ + 610, + 494 + ], + "final_position": [ + 249, + 512 + ] + }, + { + "type": "triangle", + "size": 223, + "color": [ + 120, + 170, + 255 + ], + "initial_position": [ + 849, + 197 + ], + "final_position": [ + 457, + 512 + ] + } + ], + [ + { + "type": "circle", + "size": 62, + "color": [ + 120, + 170, + 255 + ], + "initial_position": [ + 318, + 383 + ], + "final_position": [ + 625, + 512 + ] + }, + { + "type": "circle", + "size": 99, + "color": [ + 120, + 170, + 255 + ], + "initial_position": [ + 775, + 614 + ], + "final_position": [ + 730, + 512 + ] + }, + { + "type": "circle", + "size": 158, + "color": [ + 120, + 170, + 255 + ], + "initial_position": [ + 440, + 667 + ], + "final_position": [ + 884, + 512 + ] + } + ] + ], + "type_order": [ + "triangle", + "circle" + ] + }, + "param_hash": "fb97ff4b5cac83b0", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/stable_sort_task/stable_sort_00000002/prompt.txt b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..bf4a029493ecf997b81d163c29a1ecab1adef05b --- /dev/null +++ b/VBVR-Dataset/stable_sort_task/stable_sort_00000002/prompt.txt @@ -0,0 +1 @@ +The scene contains two types of shapes, each type has three shapes of different sizes arranged randomly. Keep all shapes unchanged in appearance (type, size, and color). Only rearrange their positions: first group the shapes by type, then within each group, sort the shapes from smallest to largest (left to right), and arrange all shapes in a single horizontal line from left to right. 
\ No newline at end of file diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/final_frame.png b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c30bdba16fd6bfea51b7b019fd243af4b4988514 Binary files /dev/null and b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/final_frame.png differ diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/first_frame.png b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d57cf7ae40dee52655f8db945031f8adfd194fe9 Binary files /dev/null and b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/first_frame.png differ diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/ground_truth.mp4 b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..536f232f866d31990a3bca3a16598cdb04128cb3 --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56003ccfc14e215258d63ac640681caf6dcede6d49461b0e0803d267a01169f1 +size 151639 diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/metadata.json b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..99d3b3a3d56537701f6de9673cec71695c33d890 --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/metadata.json @@ -0,0 +1,254 @@ +{ + "task_id": "suppress_spurious_edges_00000000", + "generator": "suppress_spurious_edges", + 
"timestamp": "2026-02-17T07:31:48.875088", + "parameters": { + "shapes": [ + { + "type": "triangle", + "vertices": [ + [ + 386, + 403 + ], + [ + 202, + 722 + ], + [ + 570, + 722 + ] + ], + "fill_color": [ + 173, + 216, + 230 + ], + "outline_color": [ + 0, + 0, + 0 + ], + "edge_index": 0, + "spline_type": "wave", + "spline_points": [ + [ + 351, + 385 + ], + [ + 329, + 378 + ], + [ + 315, + 378 + ], + [ + 310, + 383 + ], + [ + 302, + 389 + ], + [ + 302, + 398 + ], + [ + 294, + 402 + ], + [ + 288, + 406 + ], + [ + 273, + 406 + ], + [ + 258, + 406 + ], + [ + 247, + 409 + ], + [ + 234, + 406 + ], + [ + 225, + 413 + ], + [ + 227, + 423 + ], + [ + 235, + 436 + ], + [ + 253, + 455 + ], + [ + 280, + 479 + ], + [ + 310, + 504 + ], + [ + 340, + 531 + ], + [ + 370, + 553 + ], + [ + 396, + 575 + ], + [ + 408, + 593 + ], + [ + 418, + 607 + ], + [ + 416, + 617 + ], + [ + 408, + 618 + ], + [ + 396, + 621 + ], + [ + 378, + 622 + ], + [ + 364, + 621 + ], + [ + 357, + 625 + ], + [ + 347, + 627 + ], + [ + 342, + 633 + ], + [ + 340, + 639 + ], + [ + 332, + 643 + ], + [ + 324, + 649 + ], + [ + 311, + 646 + ], + [ + 286, + 644 + ], + [ + 258, + 635 + ], + [ + 224, + 624 + ], + [ + 191, + 615 + ], + [ + 154, + 603 + ], + [ + 127, + 594 + ], + [ + 104, + 587 + ], + [ + 90, + 590 + ], + [ + 87, + 594 + ], + [ + 91, + 609 + ], + [ + 107, + 626 + ], + [ + 124, + 642 + ], + [ + 143, + 665 + ], + [ + 162, + 683 + ], + [ + 174, + 697 + ], + [ + 187, + 713 + ] + ] + } + ] + }, + "param_hash": "675bbe89650073a6", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/prompt.txt b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7187203ba1b363b71a18f5351007cd5bd8759a4 --- /dev/null +++ 
b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows 1 geometric shape. One straight edge of the shape has an irregular spurious spline curve drawn on top of it (a wavy or zigzag line that does not match the straight edge). First identify the spurious spline curve(s), then smoothly fade out the spline curve(s) while keeping the original straight edge(s) unchanged. Keep the shapes fixed and do not add any new lines. Show the complete removal process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/final_frame.png b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..677efc718056a52e6d3896b37f5a70f26e106ae4 Binary files /dev/null and b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/final_frame.png differ diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/first_frame.png b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..287f0b40597f137386cbe61b4d90ebcc1d6928e4 Binary files /dev/null and b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/first_frame.png differ diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/ground_truth.mp4 b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..b3c4735265d9f4ca13c6374097c6c6ef82102180 --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad98661845e1e271595fb456c725d2391ade99ff917f21867cbde5ae612e0d8d +size 235923 
diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/metadata.json b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6383273bf383374008eddabf8bfdbc63bee96498 --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/metadata.json @@ -0,0 +1,748 @@ +{ + "task_id": "suppress_spurious_edges_00000001", + "generator": "suppress_spurious_edges", + "timestamp": "2026-02-17T07:31:49.496119", + "parameters": { + "shapes": [ + { + "type": "pentagon", + "vertices": [ + [ + 267, + 295 + ], + [ + 39, + 461 + ], + [ + 126, + 729 + ], + [ + 408, + 729 + ], + [ + 495, + 461 + ] + ], + "fill_color": [ + 200, + 200, + 200 + ], + "outline_color": [ + 0, + 0, + 0 + ], + "edge_index": 1, + "spline_type": "wave", + "spline_points": [ + [ + -7, + 477 + ], + [ + 16, + 476 + ], + [ + 36, + 475 + ], + [ + 49, + 475 + ], + [ + 62, + 477 + ], + [ + 68, + 481 + ], + [ + 73, + 485 + ], + [ + 81, + 488 + ], + [ + 95, + 492 + ], + [ + 111, + 493 + ], + [ + 123, + 492 + ], + [ + 139, + 495 + ], + [ + 143, + 499 + ], + [ + 136, + 506 + ], + [ + 117, + 517 + ], + [ + 92, + 532 + ], + [ + 69, + 546 + ], + [ + 44, + 558 + ], + [ + 25, + 573 + ], + [ + 19, + 579 + ], + [ + 19, + 584 + ], + [ + 20, + 592 + ], + [ + 26, + 596 + ], + [ + 30, + 598 + ], + [ + 31, + 607 + ], + [ + 25, + 613 + ], + [ + 23, + 618 + ], + [ + 28, + 625 + ], + [ + 38, + 627 + ], + [ + 60, + 624 + ], + [ + 88, + 621 + ], + [ + 117, + 619 + ], + [ + 143, + 615 + ], + [ + 168, + 613 + ], + [ + 176, + 619 + ], + [ + 180, + 621 + ], + [ + 172, + 633 + ], + [ + 157, + 641 + ], + [ + 150, + 652 + ], + [ + 139, + 661 + ], + [ + 137, + 666 + ], + [ + 133, + 672 + ], + [ + 134, + 681 + ], + [ + 126, + 685 + ], + [ + 115, + 699 + ], + [ + 95, + 708 + ], + [ + 75, + 720 + ], + [ + 53, + 736 + ], + [ + 37, + 747 + ], + [ + 34, + 750 + ], + [ + 42, + 756 + ] + ] + 
}, + { + "type": "pentagon", + "vertices": [ + [ + 832, + 547 + ], + [ + 723, + 627 + ], + [ + 765, + 755 + ], + [ + 899, + 755 + ], + [ + 941, + 627 + ] + ], + "fill_color": [ + 255, + 182, + 193 + ], + "outline_color": [ + 50, + 50, + 50 + ], + "edge_index": 2, + "spline_type": "wave", + "spline_points": [ + [ + 767, + 767 + ], + [ + 767, + 768 + ], + [ + 771, + 772 + ], + [ + 775, + 773 + ], + [ + 774, + 771 + ], + [ + 780, + 775 + ], + [ + 782, + 772 + ], + [ + 782, + 774 + ], + [ + 785, + 775 + ], + [ + 787, + 775 + ], + [ + 789, + 775 + ], + [ + 794, + 774 + ], + [ + 797, + 780 + ], + [ + 798, + 781 + ], + [ + 800, + 783 + ], + [ + 805, + 781 + ], + [ + 807, + 786 + ], + [ + 811, + 782 + ], + [ + 815, + 783 + ], + [ + 817, + 782 + ], + [ + 817, + 779 + ], + [ + 820, + 778 + ], + [ + 824, + 773 + ], + [ + 824, + 764 + ], + [ + 830, + 759 + ], + [ + 831, + 754 + ], + [ + 833, + 749 + ], + [ + 839, + 740 + ], + [ + 841, + 734 + ], + [ + 844, + 729 + ], + [ + 845, + 728 + ], + [ + 847, + 723 + ], + [ + 852, + 722 + ], + [ + 853, + 722 + ], + [ + 858, + 725 + ], + [ + 860, + 726 + ], + [ + 860, + 726 + ], + [ + 865, + 731 + ], + [ + 865, + 730 + ], + [ + 867, + 733 + ], + [ + 874, + 737 + ], + [ + 872, + 736 + ], + [ + 877, + 738 + ], + [ + 878, + 740 + ], + [ + 884, + 737 + ], + [ + 886, + 740 + ], + [ + 887, + 740 + ], + [ + 890, + 740 + ], + [ + 891, + 738 + ], + [ + 896, + 743 + ], + [ + 898, + 742 + ] + ] + }, + { + "type": "pentagon", + "vertices": [ + [ + 774, + 48 + ], + [ + 563, + 202 + ], + [ + 644, + 449 + ], + [ + 904, + 449 + ], + [ + 985, + 202 + ] + ], + "fill_color": [ + 255, + 182, + 193 + ], + "outline_color": [ + 50, + 50, + 50 + ], + "edge_index": 3, + "spline_type": "zigzag", + "spline_points": [ + [ + 936, + 458 + ], + [ + 928, + 453 + ], + [ + 922, + 442 + ], + [ + 918, + 437 + ], + [ + 909, + 426 + ], + [ + 901, + 421 + ], + [ + 894, + 412 + ], + [ + 889, + 406 + ], + [ + 880, + 395 + ], + [ + 875, + 392 + ], + [ + 868, + 380 + ], + [ + 
874, + 379 + ], + [ + 885, + 375 + ], + [ + 893, + 377 + ], + [ + 906, + 371 + ], + [ + 914, + 369 + ], + [ + 924, + 368 + ], + [ + 936, + 367 + ], + [ + 948, + 362 + ], + [ + 955, + 360 + ], + [ + 969, + 360 + ], + [ + 977, + 356 + ], + [ + 987, + 355 + ], + [ + 994, + 352 + ], + [ + 986, + 343 + ], + [ + 980, + 337 + ], + [ + 973, + 327 + ], + [ + 964, + 320 + ], + [ + 955, + 312 + ], + [ + 952, + 305 + ], + [ + 941, + 295 + ], + [ + 938, + 290 + ], + [ + 927, + 283 + ], + [ + 921, + 274 + ], + [ + 914, + 264 + ], + [ + 908, + 260 + ], + [ + 917, + 257 + ], + [ + 926, + 254 + ], + [ + 937, + 252 + ], + [ + 947, + 251 + ], + [ + 954, + 248 + ], + [ + 966, + 246 + ], + [ + 979, + 243 + ], + [ + 986, + 239 + ], + [ + 996, + 236 + ], + [ + 1009, + 236 + ], + [ + 1017, + 235 + ], + [ + 1026, + 231 + ], + [ + 1034, + 227 + ], + [ + 1025, + 221 + ], + [ + 1020, + 214 + ] + ] + } + ] + }, + "param_hash": "4c7e14dd19278869", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/prompt.txt b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..ec5569b71cc9358033e0616b89a5955065ddf2fa --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows 3 geometric shapes. One straight edge of each shape has an irregular spurious spline curve drawn on top of it (a wavy or zigzag line that does not match the straight edge). First identify the spurious spline curve(s), then smoothly fade out the spline curve(s) while keeping the original straight edge(s) unchanged. Keep the shapes fixed and do not add any new lines. Show the complete removal process step by step. 
\ No newline at end of file diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/final_frame.png b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..89eb56cb5db0e5cc410a706f96f834c81e98445a Binary files /dev/null and b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/final_frame.png differ diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/first_frame.png b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..5d5a050e158ce0e42b4d0eca25189708939da54a Binary files /dev/null and b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/first_frame.png differ diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/ground_truth.mp4 b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..31da6bf55ff39f46a05e5cf940fc0f170a0b8605 --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dda505aa13d8644aefddb8177319640dd7a8f81c7ac67692baf0b7d0f67b5e3 +size 139131 diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/metadata.json b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..11357637986e426a43e78d1e0401cb5bb78b334c --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/metadata.json @@ -0,0 +1,262 @@ +{ + "task_id": "suppress_spurious_edges_00000002", + "generator": "suppress_spurious_edges", + 
"timestamp": "2026-02-17T07:31:50.083175", + "parameters": { + "shapes": [ + { + "type": "pentagon", + "vertices": [ + [ + 727, + 417 + ], + [ + 507, + 578 + ], + [ + 591, + 836 + ], + [ + 863, + 836 + ], + [ + 947, + 578 + ] + ], + "fill_color": [ + 173, + 216, + 230 + ], + "outline_color": [ + 0, + 0, + 0 + ], + "edge_index": 0, + "spline_type": "wave", + "spline_points": [ + [ + 715, + 398 + ], + [ + 709, + 405 + ], + [ + 710, + 409 + ], + [ + 703, + 412 + ], + [ + 700, + 417 + ], + [ + 698, + 427 + ], + [ + 700, + 433 + ], + [ + 696, + 440 + ], + [ + 698, + 451 + ], + [ + 699, + 464 + ], + [ + 702, + 473 + ], + [ + 707, + 488 + ], + [ + 710, + 500 + ], + [ + 708, + 514 + ], + [ + 713, + 527 + ], + [ + 712, + 534 + ], + [ + 712, + 544 + ], + [ + 705, + 546 + ], + [ + 703, + 548 + ], + [ + 696, + 546 + ], + [ + 687, + 544 + ], + [ + 675, + 539 + ], + [ + 662, + 533 + ], + [ + 649, + 524 + ], + [ + 636, + 516 + ], + [ + 626, + 511 + ], + [ + 614, + 506 + ], + [ + 604, + 500 + ], + [ + 595, + 496 + ], + [ + 586, + 492 + ], + [ + 581, + 495 + ], + [ + 576, + 496 + ], + [ + 568, + 497 + ], + [ + 565, + 501 + ], + [ + 556, + 503 + ], + [ + 554, + 504 + ], + [ + 548, + 504 + ], + [ + 541, + 504 + ], + [ + 530, + 501 + ], + [ + 523, + 498 + ], + [ + 517, + 499 + ], + [ + 508, + 493 + ], + [ + 497, + 491 + ], + [ + 489, + 492 + ], + [ + 484, + 493 + ], + [ + 481, + 496 + ], + [ + 479, + 503 + ], + [ + 475, + 508 + ], + [ + 477, + 521 + ], + [ + 480, + 531 + ], + [ + 486, + 546 + ] + ] + } + ] + }, + "param_hash": "2982817c949a863a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/prompt.txt b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/prompt.txt new file mode 100644 index 
0000000000000000000000000000000000000000..c7187203ba1b363b71a18f5351007cd5bd8759a4 --- /dev/null +++ b/VBVR-Dataset/suppress_spurious_edges_task/suppress_spurious_edges_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows 1 geometric shape. One straight edge of the shape has an irregular spurious spline curve drawn on top of it (a wavy or zigzag line that does not match the straight edge). First identify the spurious spline curve(s), then smoothly fade out the spline curve(s) while keeping the original straight edge(s) unchanged. Keep the shapes fixed and do not add any new lines. Show the complete removal process step by step. \ No newline at end of file diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/final_frame.png b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1262a2c5375130359f39c5c5dbd8423cfb2809e5 Binary files /dev/null and b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/final_frame.png differ diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/first_frame.png b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d0c94035cc23003899ec6699dfa1b0af9dba64f3 Binary files /dev/null and b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/first_frame.png differ diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/ground_truth.mp4 b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7cc17316379ef8b4d8771eab31b1e8bb94570d6b --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8571eb85be375b6b0b6720f7716d238f8626344945cfbeed6624e8ddd8c2a2bb +size 185524 diff 
--git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/metadata.json b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..f976f41b2303855dffe3a4e2d850a92f839f5ee4 --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/metadata.json @@ -0,0 +1,96 @@ +{ + "task_id": "symbol_reordering_00000000", + "generator": "symbol_reordering", + "timestamp": "2026-02-17T07:52:14.105940", + "parameters": { + "symbol_type": "mixed", + "initial_sequence": [ + 0, + 2, + 3, + 1 + ], + "target_sequence": [ + 0, + 1, + 2, + 3 + ], + "objects": [ + { + "symbol": "B", + "initial_center": [ + 120, + 512 + ], + "target_center": [ + 120, + 512 + ], + "color": [ + 100, + 150, + 250 + ] + }, + { + "symbol": "triangle", + "initial_center": [ + 421, + 512 + ], + "target_center": [ + 722, + 512 + ], + "color": [ + 150, + 100, + 200 + ] + }, + { + "symbol": "2", + "initial_center": [ + 722, + 512 + ], + "target_center": [ + 904, + 512 + ], + "color": [ + 250, + 150, + 100 + ] + }, + { + "symbol": "1", + "initial_center": [ + 904, + 512 + ], + "target_center": [ + 421, + 512 + ], + "color": [ + 250, + 150, + 100 + ] + } + ] + }, + "param_hash": "569ec8413bd3d070", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/prompt.txt b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..03925a18165f25e3e78f8ed2de7ace27d2a993e4 --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a sequence of 4 mixed symbols arranged horizontally from left to right. 
Position labels (0 to 3) are shown below each symbol, indicating the target position where each symbol should move to. In symbol reordering tasks, each symbol must move from its current position to its target position indicated by the position label shown below it. The reordering rule is: first identify each symbol's current position in the sequence (from left to right, starting at position 0), then read the target position label below the symbol to determine where it should move, then move the symbol horizontally to that target position. Observe the initial sequence and read the position labels to determine where each symbol should move. Animate each symbol moving smoothly from its current position to its target position, ensuring all symbols reach their exact final locations as specified by the position labels. \ No newline at end of file diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/final_frame.png b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f17c6fa8280f0e7c5c5bb8d8efe061a1e83b7353 Binary files /dev/null and b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/final_frame.png differ diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/first_frame.png b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..48e6e1788c6e3bbaeb5299d96e42731521687664 Binary files /dev/null and b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/first_frame.png differ diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/ground_truth.mp4 b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..655823aab6e4f976ce781f0b226ae13058123454 --- /dev/null +++ 
b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48da99f228ca5d14e552704d11467a7225cbf294c8acfc4cf579da947a891d29 +size 221184 diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/metadata.json b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..25410bbedb2b52cbcb3fa2ef4b1875f602490144 --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/metadata.json @@ -0,0 +1,114 @@ +{ + "task_id": "symbol_reordering_00000001", + "generator": "symbol_reordering", + "timestamp": "2026-02-17T07:52:14.805571", + "parameters": { + "symbol_type": "letters", + "initial_sequence": [ + 0, + 3, + 1, + 2, + 4 + ], + "target_sequence": [ + 0, + 1, + 2, + 3, + 4 + ], + "objects": [ + { + "symbol": "M", + "initial_center": [ + 120, + 512 + ], + "target_center": [ + 120, + 512 + ], + "color": [ + 100, + 150, + 250 + ] + }, + { + "symbol": "D", + "initial_center": [ + 346, + 512 + ], + "target_center": [ + 798, + 512 + ], + "color": [ + 100, + 150, + 250 + ] + }, + { + "symbol": "U", + "initial_center": [ + 572, + 512 + ], + "target_center": [ + 346, + 512 + ], + "color": [ + 100, + 150, + 250 + ] + }, + { + "symbol": "T", + "initial_center": [ + 798, + 512 + ], + "target_center": [ + 572, + 512 + ], + "color": [ + 100, + 150, + 250 + ] + }, + { + "symbol": "Q", + "initial_center": [ + 904, + 512 + ], + "target_center": [ + 904, + 512 + ], + "color": [ + 100, + 150, + 250 + ] + } + ] + }, + "param_hash": "6f9ebcfd717f1a86", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/prompt.txt b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/prompt.txt new 
file mode 100644 index 0000000000000000000000000000000000000000..e315a9cee1431abd51fc2a1f1748e80f5a606f2b --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a sequence of 5 letter symbols arranged horizontally from left to right. Position labels (0 to 4) are shown below each symbol, indicating the target position where each symbol should move to. In symbol reordering tasks, each symbol must move from its current position to its target position indicated by the position label shown below it. The reordering rule is: first identify each symbol's current position in the sequence (from left to right, starting at position 0), then read the target position label below the symbol to determine where it should move, then move the symbol horizontally to that target position. Observe the initial sequence and read the position labels to determine where each symbol should move. Animate each symbol moving smoothly from its current position to its target position, ensuring all symbols reach their exact final locations as specified by the position labels. 
\ No newline at end of file diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/final_frame.png b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..02b4aefbc4baf4d3286ea302a92226ea624238f5 Binary files /dev/null and b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/final_frame.png differ diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/first_frame.png b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8e6bd941aac19c26d7b6d9fddedac06ffa3a34e7 Binary files /dev/null and b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/first_frame.png differ diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/ground_truth.mp4 b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7fd5d5651ff50d3c6c34f6437f448c606ececf4a --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d7295891594ce4c8c64b362f1f480868e75ff2bd5bd9670c94652c34f832e7 +size 296988 diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/metadata.json b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8b1fe98e73914b171e87c23ee999623226f32a0a --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/metadata.json @@ -0,0 +1,150 @@ +{ + "task_id": "symbol_reordering_00000002", + "generator": "symbol_reordering", + "timestamp": "2026-02-17T07:52:15.478358", + "parameters": { + "symbol_type": "shapes", + "initial_sequence": [ + 0, + 2, + 3, + 1, + 6, + 5, + 4 + ], + 
"target_sequence": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6 + ], + "objects": [ + { + "symbol": "triangle", + "initial_center": [ + 120, + 281 + ], + "target_center": [ + 120, + 281 + ], + "color": [ + 150, + 100, + 200 + ] + }, + { + "symbol": "circle", + "initial_center": [ + 361, + 281 + ], + "target_center": [ + 662, + 281 + ], + "color": [ + 100, + 200, + 100 + ] + }, + { + "symbol": "hexagon", + "initial_center": [ + 662, + 281 + ], + "target_center": [ + 904, + 281 + ], + "color": [ + 200, + 150, + 100 + ] + }, + { + "symbol": "diamond", + "initial_center": [ + 904, + 281 + ], + "target_center": [ + 361, + 281 + ], + "color": [ + 200, + 200, + 100 + ] + }, + { + "symbol": "square", + "initial_center": [ + 120, + 743 + ], + "target_center": [ + 904, + 743 + ], + "color": [ + 200, + 100, + 100 + ] + }, + { + "symbol": "pentagon", + "initial_center": [ + 512, + 743 + ], + "target_center": [ + 512, + 743 + ], + "color": [ + 100, + 150, + 200 + ] + }, + { + "symbol": "heart", + "initial_center": [ + 904, + 743 + ], + "target_center": [ + 120, + 743 + ], + "color": [ + 255, + 100, + 150 + ] + } + ] + }, + "param_hash": "5d36183f35a52da1", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/prompt.txt b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..772e297501c46869dd9c7ce3dfc542d5d4d8a17a --- /dev/null +++ b/VBVR-Dataset/symbol_reordering_task/symbol_reordering_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a sequence of 7 geometric shapes arranged horizontally from left to right. Position labels (0 to 6) are shown below each symbol, indicating the target position where each symbol should move to. 
In symbol reordering tasks, each symbol must move from its current position to its target position indicated by the position label shown below it. The reordering rule is: first identify each symbol's current position in the sequence (from left to right, starting at position 0), then read the target position label below the symbol to determine where it should move, then move the symbol horizontally to that target position. Observe the initial sequence and read the position labels to determine where each symbol should move. Animate each symbol moving smoothly from its current position to its target position, ensuring all symbols reach their exact final locations as specified by the position labels. \ No newline at end of file diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/final_frame.png b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..80cbb3cc16b6d5e530695a062edd74822edf645e Binary files /dev/null and b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/final_frame.png differ diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/first_frame.png b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..7f394a9c7cf3772db3b53a0126b55fd0cf542717 Binary files /dev/null and b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/first_frame.png differ diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/ground_truth.mp4 b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..ad529f9f4adb511dba25b5c0d36e1edcc2a6d764 --- 
/dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72d8622fc64c73f28e1387a05426ad474370bbb2515ef5589f667e3737ee0820 +size 155349 diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/metadata.json b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb99e03eef5b60c9b4393d37e400e3f13107727 --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "symbol_worlds_symbol_editing_00000000", + "generator": "symbol_worlds_symbol_editing", + "timestamp": "2026-02-17T07:58:00.003336", + "parameters": { + "symbols": [ + { + "shape": "hexagon", + "color": "pink", + "color_rgb": [ + 255, + 100, + 150 + ] + }, + { + "shape": "diamond", + "color": "green", + "color_rgb": [ + 50, + 180, + 50 + ] + }, + { + "shape": "circle", + "color": "cyan", + "color_rgb": [ + 50, + 200, + 200 + ] + }, + { + "shape": "circle", + "color": "purple", + "color_rgb": [ + 180, + 50, + 180 + ] + } + ], + "target_index": 2, + "new_symbol": { + "shape": "triangle", + "color": "orange", + "color_rgb": [ + 255, + 140, + 50 + ] + } + }, + "param_hash": "a9ef23bbb043c2cc", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/prompt.txt b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..cd98049c6063314fc75478e1cd4d21203e684773 --- /dev/null +++ 
b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a horizontal sequence of colored geometric symbols arranged from left to right. Each symbol is a distinct geometric shape with a specific color, and exactly one symbol is marked as the substitution target by a red rectangular border surrounding it. In symbol substitution tasks, the target symbol identified by the red border must be replaced with a new symbol while all other symbols remain unchanged in their original positions. First identify the symbol marked with the red border, then replace it with a orange triangle. The final state must show the sequence with the target symbol substituted by the orange triangle at the same position, while all other symbols retain their original shapes, colors, and sequential positions. The substitution operation affects only the single marked symbol, replacing it with the orange triangle. \ No newline at end of file diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/final_frame.png b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..51e9c9280f5ec90922dbd7fc6db851a6a1e63ac6 Binary files /dev/null and b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/final_frame.png differ diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/first_frame.png b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..1628038814cf1be7119e8878478bc1905500407d Binary files /dev/null and b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/first_frame.png differ diff --git 
a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/ground_truth.mp4 b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..878efd621d72fd0e8a52d7f29304ffa6fbbca896 --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2fd04694c1f190862722c2bb28f867d8eba8776e9068aa0c8a051b438128be +size 159003 diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/metadata.json b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a47da7f7b1152a1f2dfaffd8a27d9911a7a484bd --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/metadata.json @@ -0,0 +1,83 @@ +{ + "task_id": "symbol_worlds_symbol_editing_00000001", + "generator": "symbol_worlds_symbol_editing", + "timestamp": "2026-02-17T07:58:00.784279", + "parameters": { + "symbols": [ + { + "shape": "triangle", + "color": "cyan", + "color_rgb": [ + 50, + 200, + 200 + ] + }, + { + "shape": "square", + "color": "green", + "color_rgb": [ + 50, + 180, + 50 + ] + }, + { + "shape": "star", + "color": "blue", + "color_rgb": [ + 50, + 100, + 220 + ] + }, + { + "shape": "circle", + "color": "pink", + "color_rgb": [ + 255, + 100, + 150 + ] + }, + { + "shape": "hexagon", + "color": "red", + "color_rgb": [ + 220, + 50, + 50 + ] + }, + { + "shape": "hexagon", + "color": "purple", + "color_rgb": [ + 180, + 50, + 180 + ] + } + ], + "target_index": 4, + "new_symbol": { + "shape": "hexagon", + "color": "cyan", + "color_rgb": [ + 50, + 200, + 200 + ] + } + }, + "param_hash": "29413999e8daab85", + "generation": { + "seed": 1965760370, + "git": { + "commit": 
"", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/prompt.txt b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..72aff120f94fccce0b4acb25eaca2796dbc59d3c --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a horizontal sequence of colored geometric symbols arranged from left to right. Each symbol is a distinct geometric shape with a specific color, and exactly one symbol is marked as the substitution target by a red rectangular border surrounding it. In symbol substitution tasks, the target symbol identified by the red border must be replaced with a new symbol while all other symbols remain unchanged in their original positions. First identify the symbol marked with the red border, then replace it with a cyan hexagon. The final state must show the sequence with the target symbol substituted by the cyan hexagon at the same position, while all other symbols retain their original shapes, colors, and sequential positions. The substitution operation affects only the single marked symbol, replacing it with the cyan hexagon. 
\ No newline at end of file diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/final_frame.png b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..55b6af916f9a359d352446e974362c5b8092c344 Binary files /dev/null and b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/final_frame.png differ diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/first_frame.png b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..eb70f40cce056c131c8c2557fd4ea581ad537f0b Binary files /dev/null and b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/first_frame.png differ diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/ground_truth.mp4 b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c515a34357e970c702438aa50521aa6fc9725786 --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9782e06c0b1bc3671b24af64b5976f53d8e8fbb5ee950b64ef2570d4ad2863 +size 170780 diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/metadata.json b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..548d172204130f2abd8dcff8910298545d0ee764 --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/metadata.json 
@@ -0,0 +1,92 @@ +{ + "task_id": "symbol_worlds_symbol_editing_00000002", + "generator": "symbol_worlds_symbol_editing", + "timestamp": "2026-02-17T07:58:01.611980", + "parameters": { + "symbols": [ + { + "shape": "diamond", + "color": "pink", + "color_rgb": [ + 255, + 100, + 150 + ] + }, + { + "shape": "square", + "color": "red", + "color_rgb": [ + 220, + 50, + 50 + ] + }, + { + "shape": "triangle", + "color": "purple", + "color_rgb": [ + 180, + 50, + 180 + ] + }, + { + "shape": "triangle", + "color": "blue", + "color_rgb": [ + 50, + 100, + 220 + ] + }, + { + "shape": "diamond", + "color": "cyan", + "color_rgb": [ + 50, + 200, + 200 + ] + }, + { + "shape": "circle", + "color": "red", + "color_rgb": [ + 220, + 50, + 50 + ] + }, + { + "shape": "hexagon", + "color": "cyan", + "color_rgb": [ + 50, + 200, + 200 + ] + } + ], + "target_index": 0, + "new_symbol": { + "shape": "circle", + "color": "pink", + "color_rgb": [ + 255, + 100, + 150 + ] + } + }, + "param_hash": "74054aab05b88f84", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/prompt.txt b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..66c0bfbfe2222d787f97a26a41942ccc52eff0b8 --- /dev/null +++ b/VBVR-Dataset/symbol_worlds_symbol_editing_task/symbol_worlds_symbol_editing_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a horizontal sequence of colored geometric symbols arranged from left to right. Each symbol is a distinct geometric shape with a specific color, and exactly one symbol is marked as the substitution target by a red rectangular border surrounding it. 
In symbol substitution tasks, the target symbol identified by the red border must be replaced with a new symbol while all other symbols remain unchanged in their original positions. First identify the symbol marked with the red border, then replace it with a pink circle. The final state must show the sequence with the target symbol substituted by the pink circle at the same position, while all other symbols retain their original shapes, colors, and sequential positions. The substitution operation affects only the single marked symbol, replacing it with the pink circle. \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/final_frame.png b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..69c92f81a39744b48cac5ea17eb0d4c6cc4c8826 Binary files /dev/null and b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/final_frame.png differ diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/first_frame.png b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..afce83e07ff1ac2e096910362be0f8b6121e7a41 Binary files /dev/null and b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/first_frame.png differ diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/ground_truth.mp4 b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..6b982e3f1defabe697a1f748db6c1735d533f24d --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c228eb3669cfcdce3ae4444c5411418b5ff4e4aaf8583114c755f3c4dd411d2 +size 358912 diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/metadata.json 
b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..869231120a6d2ecf23dc2deeff812ba948131ca3 --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/metadata.json @@ -0,0 +1,78 @@ +{ + "task_id": "symmetry_random_00000000", + "generator": "symmetry_random", + "timestamp": "2026-02-17T07:24:21.677240", + "parameters": { + "color": [ + 74, + 68, + 220 + ], + "grid_size": 9, + "scatter_size": 13, + "initial_scatter": [ + [ + 0, + 0 + ], + [ + 0, + 1 + ], + [ + 1, + 1 + ], + [ + 3, + 2 + ], + [ + 4, + 3 + ], + [ + 5, + 1 + ], + [ + 5, + 2 + ], + [ + 6, + 0 + ], + [ + 6, + 1 + ], + [ + 6, + 2 + ], + [ + 6, + 3 + ], + [ + 7, + 2 + ], + [ + 8, + 2 + ] + ] + }, + "param_hash": "0b2449c5e063d164", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/prompt.txt b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e49ac87224f3015c9b1f3f4bee9f734a2fedf3d --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a grid with a random scatter pattern on the left half. Expand the scatter pattern symmetrically to the right half by mirroring it across the vertical axis, creating a complete symmetric pattern. 
\ No newline at end of file diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/final_frame.png b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..511e86c1aac353bcd95fd41cad41ed3bb633e258 Binary files /dev/null and b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/final_frame.png differ diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/first_frame.png b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c26217d79ca32fb469367b807780f3e7443ab3b1 Binary files /dev/null and b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/first_frame.png differ diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/ground_truth.mp4 b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..0f681e453920b5e7ba2daf5970f2902239e1045d --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ae7f7babfed47df0d6c04b8ae6f81d96b1a88aa8718efbdeac9e947e683113 +size 284145 diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/metadata.json b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1e68aa15977720fca20c5216fb457f40f4cac801 --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/metadata.json @@ -0,0 +1,82 @@ +{ + "task_id": "symmetry_random_00000001", + "generator": "symmetry_random", + "timestamp": "2026-02-17T07:24:22.368629", + "parameters": { + "color": [ + 217, + 254, + 153 + ], + "grid_size": 12, + "scatter_size": 14, + "initial_scatter": [ + [ + 0, + 3 + ], + [ + 0, + 4 + ], + [ + 0, + 5 + 
], + [ + 1, + 0 + ], + [ + 3, + 2 + ], + [ + 5, + 1 + ], + [ + 5, + 2 + ], + [ + 5, + 4 + ], + [ + 6, + 3 + ], + [ + 7, + 2 + ], + [ + 7, + 5 + ], + [ + 8, + 2 + ], + [ + 9, + 2 + ], + [ + 11, + 3 + ] + ] + }, + "param_hash": "9c9a95f939d93fab", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/prompt.txt b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e49ac87224f3015c9b1f3f4bee9f734a2fedf3d --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a grid with a random scatter pattern on the left half. Expand the scatter pattern symmetrically to the right half by mirroring it across the vertical axis, creating a complete symmetric pattern. \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/final_frame.png b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0f05c7d85872b02d0a5d1a49d9a73a4485a8938d Binary files /dev/null and b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/final_frame.png differ diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/first_frame.png b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d17cb3284583a443db20bc91579ef86129fb2589 Binary files /dev/null and b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/first_frame.png differ diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/ground_truth.mp4 b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/ground_truth.mp4 new file mode 100644 index 
0000000000000000000000000000000000000000..43ac3dad6ac667376af8678c9e4bde420c186e91 --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56b42ef243e5ed933af58e733d246d3e420f1d055a661fb3dd0848e82ce9100 +size 265447 diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/metadata.json b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..085e3d3a8d56e735c4736eb0eed39216af857997 --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/metadata.json @@ -0,0 +1,58 @@ +{ + "task_id": "symmetry_random_00000002", + "generator": "symmetry_random", + "timestamp": "2026-02-17T07:24:23.085648", + "parameters": { + "color": [ + 161, + 178, + 205 + ], + "grid_size": 10, + "scatter_size": 8, + "initial_scatter": [ + [ + 2, + 1 + ], + [ + 3, + 0 + ], + [ + 3, + 3 + ], + [ + 5, + 1 + ], + [ + 6, + 1 + ], + [ + 7, + 3 + ], + [ + 9, + 1 + ], + [ + 9, + 4 + ] + ] + }, + "param_hash": "34d4b1a13c1d98ae", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/prompt.txt b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..0e49ac87224f3015c9b1f3f4bee9f734a2fedf3d --- /dev/null +++ b/VBVR-Dataset/symmetry_random_task/symmetry_random_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a grid with a random scatter pattern on the left half. Expand the scatter pattern symmetrically to the right half by mirroring it across the vertical axis, creating a complete symmetric pattern. 
\ No newline at end of file diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/final_frame.png b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..02e221e8b495bd0a91458e79fb7698722b9da6aa Binary files /dev/null and b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/final_frame.png differ diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/first_frame.png b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..37b2f8b594000a2f7ba997d1d744dd7fa70a8d93 Binary files /dev/null and b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/first_frame.png differ diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/ground_truth.mp4 b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a55abbf5dce3cb333dbea7549f11b537f0745281 --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774670c6a8a969f070e246153777c5ac3163f40a98b6638196a8d1615dbd4fd6 +size 406389 diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/metadata.json b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..7aedc9dba2395255b90b8900aa8efc175181e54f --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/metadata.json @@ -0,0 +1,77 @@ +{ + "task_id": "symmetry_shape_00000000", + "generator": "symmetry_shape", + "timestamp": "2026-02-17T07:24:57.346026", + "parameters": { + "grid_size": 9, + "shape": [ + [ + 0, + 1 + ], + [ + 0, + 2 + ], + [ + 0, + 3 + ], + [ + 0, + 4 + ], + [ + 0, + 5 + ], + [ + 1, + 5 + ], + [ + 2, + 2 + ], + [ + 2, + 3 + ], + [ + 
2, + 4 + ], + [ + 2, + 5 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ], + [ + 3, + 4 + ] + ], + "color": [ + 134, + 184, + 143 + ] + }, + "param_hash": "d717f23b497328b4", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/prompt.txt b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..35813027266c44425f3a458e6ae77168e2cdf3b0 --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a grid with a continuous shape on the left half. Expand the shape symmetrically to the right half by mirroring it across the vertical axis, creating a complete symmetric shape. \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/final_frame.png b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..6d58a4a14a85f2add4635ab0b56d1f669286f6cd Binary files /dev/null and b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/final_frame.png differ diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/first_frame.png b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..935eb67d77ab284d576989d69d1b07dbbee7f5cd Binary files /dev/null and b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/first_frame.png differ diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/ground_truth.mp4 b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..f5c46a64a0a1003bf1ec07061598bf3e972698ef --- /dev/null +++ 
b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61c4561284f466b24add9b80f35cc64bec879f85fdb2d57b7257d8597f16b502 +size 419688 diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/metadata.json b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..6fa2892fc1059ea5451ae9435028e97fe3d4133b --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/metadata.json @@ -0,0 +1,85 @@ +{ + "task_id": "symmetry_shape_00000001", + "generator": "symmetry_shape", + "timestamp": "2026-02-17T07:25:00.673501", + "parameters": { + "grid_size": 10, + "shape": [ + [ + 0, + 8 + ], + [ + 0, + 9 + ], + [ + 1, + 8 + ], + [ + 1, + 9 + ], + [ + 2, + 8 + ], + [ + 2, + 9 + ], + [ + 3, + 5 + ], + [ + 3, + 6 + ], + [ + 3, + 7 + ], + [ + 3, + 8 + ], + [ + 3, + 9 + ], + [ + 4, + 5 + ], + [ + 4, + 6 + ], + [ + 4, + 7 + ], + [ + 4, + 8 + ] + ], + "color": [ + 221, + 64, + 160 + ] + }, + "param_hash": "af6479bfbc578735", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/prompt.txt b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..35813027266c44425f3a458e6ae77168e2cdf3b0 --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a grid with a continuous shape on the left half. Expand the shape symmetrically to the right half by mirroring it across the vertical axis, creating a complete symmetric shape. 
\ No newline at end of file diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/final_frame.png b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..262dbfcbfd905fa85b776e3ffa26d9b9bf0e29c2 Binary files /dev/null and b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/final_frame.png differ diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/first_frame.png b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8efcc0044f994417eee8d9c504b9f5081834a1e4 Binary files /dev/null and b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/first_frame.png differ diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/ground_truth.mp4 b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3be31160a9cabf811e880547c2f1e6c2bcf4230c --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00bac731d5c5c0b1f687e16e2e45d0fcc3f29e680d58b15b71b955c974fca45b +size 407435 diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/metadata.json b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..5a5b64095798155152e30111fd1d1f5ae05b3798 --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/metadata.json @@ -0,0 +1,53 @@ +{ + "task_id": "symmetry_shape_00000002", + "generator": "symmetry_shape", + "timestamp": "2026-02-17T07:25:02.491902", + "parameters": { + "grid_size": 12, + "shape": [ + [ + 1, + 0 + ], + [ + 1, + 1 + ], + [ + 2, + 1 + ], + [ + 2, + 2 + ], + [ + 2, + 3 + ], + [ + 3, + 2 + ], + [ + 3, + 3 + ] + ], + "color": [ + 
142, + 126, + 114 + ] + }, + "param_hash": "12568f13440c11fc", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/prompt.txt b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..35813027266c44425f3a458e6ae77168e2cdf3b0 --- /dev/null +++ b/VBVR-Dataset/symmetry_shape_task/symmetry_shape_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a grid with a continuous shape on the left half. Expand the shape symmetrically to the right half by mirroring it across the vertical axis, creating a complete symmetric shape. \ No newline at end of file diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/final_frame.png b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..44d59f2b0f0c1db816b7b1535441d194ce58e1a0 Binary files /dev/null and b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/final_frame.png differ diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/first_frame.png b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8a64531ab33a729b9435a76c8c2111cf13c0f00a Binary files /dev/null and b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/first_frame.png differ diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/ground_truth.mp4 b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..04de6dcf8e034ed9679f7359500d31e7aa217287 --- /dev/null +++ 
b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eabe67518fa3b731a652d8c7c161b14292e0fafcf5fea3b3eb04ed247c90801 +size 244578 diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/metadata.json b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9f616b10ec76166e4f4567f322828038b91e9352 --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/metadata.json @@ -0,0 +1,73 @@ +{ + "task_id": "track_object_movement_00000000", + "generator": "track_object_movement", + "timestamp": "2026-02-17T07:35:24.275872", + "parameters": { + "objects": [ + { + "x": 727, + "y": 383, + "size": 115, + "shape": "heptagon", + "color": [ + 133, + 153, + 76 + ], + "is_target": true, + "is_tracked": false + }, + { + "x": 588, + "y": 627, + "size": 93, + "shape": "star", + "color": [ + 53, + 111, + 153 + ], + "is_target": false, + "is_tracked": true + }, + { + "x": 912, + "y": 312, + "size": 107, + "shape": "triangle", + "color": [ + 229, + 157, + 114 + ], + "is_target": false, + "is_tracked": false + }, + { + "x": 536, + "y": 770, + "size": 83, + "shape": "star", + "color": [ + 153, + 30, + 142 + ], + "is_target": false, + "is_tracked": false + } + ], + "target_x": 727, + "target_y": 627 + }, + "param_hash": "46557040ae14c719", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/prompt.txt b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..b881338d231d52395adeddf465775cd7e60e7ac0 --- /dev/null +++ 
b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000000/prompt.txt @@ -0,0 +1 @@ +The object marked with a green border is the only object that moves. It moves horizontally to align directly below the object with a red star at its center. Track the movement with the green border as the object moves. \ No newline at end of file diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/final_frame.png b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ab14ac5f7ac2b10c94aa60c66be3ca0b518f5907 Binary files /dev/null and b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/final_frame.png differ diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/first_frame.png b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..b28881746c980daba4dc8559b313517bb3440c8e Binary files /dev/null and b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/first_frame.png differ diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/ground_truth.mp4 b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..5aeb001872804a249f9feb15690728035b146f4c --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:851812581a4a205b295bb4743d436bbc377ef65245058e7272899c000241a520 +size 231794 diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/metadata.json b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/metadata.json new file mode 100644 index 
0000000000000000000000000000000000000000..952320c69c23b5c4400ae5767623061808f13686 --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/metadata.json @@ -0,0 +1,86 @@ +{ + "task_id": "track_object_movement_00000001", + "generator": "track_object_movement", + "timestamp": "2026-02-17T07:35:24.979066", + "parameters": { + "objects": [ + { + "x": 173, + "y": 443, + "size": 118, + "shape": "rectangle", + "color": [ + 153, + 30, + 142 + ], + "is_target": true, + "is_tracked": false + }, + { + "x": 107, + "y": 705, + "size": 105, + "shape": "star", + "color": [ + 229, + 114, + 186 + ], + "is_target": false, + "is_tracked": true + }, + { + "x": 630, + "y": 701, + "size": 109, + "shape": "square", + "color": [ + 80, + 185, + 229 + ], + "is_target": false, + "is_tracked": false + }, + { + "x": 641, + "y": 522, + "size": 94, + "shape": "rectangle", + "color": [ + 144, + 53, + 153 + ], + "is_target": false, + "is_tracked": false + }, + { + "x": 840, + "y": 348, + "size": 100, + "shape": "octagon", + "color": [ + 229, + 157, + 114 + ], + "is_target": false, + "is_tracked": false + } + ], + "target_x": 173, + "target_y": 705 + }, + "param_hash": "6491bec78ccc66c4", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/prompt.txt b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..b881338d231d52395adeddf465775cd7e60e7ac0 --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000001/prompt.txt @@ -0,0 +1 @@ +The object marked with a green border is the only object that moves. It moves horizontally to align directly below the object with a red star at its center. Track the movement with the green border as the object moves. 
\ No newline at end of file diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/final_frame.png b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..70527bd21a42319f04802d05f37d6761f67e5f76 Binary files /dev/null and b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/final_frame.png differ diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/first_frame.png b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f26196dc0ce58b81b7d59bab6d5fad564412d794 Binary files /dev/null and b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/first_frame.png differ diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/ground_truth.mp4 b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..c8d6cc31234fdf864a1e06b750831a2d1f50da0f --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61a6576c27d10bf2092d219d98b9b5a8ae9ad1c19527e59a270e276fb813be9 +size 204224 diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/metadata.json b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ea7284469ae9745070c2d3f88212da02d57049a0 --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/metadata.json @@ -0,0 +1,86 @@ +{ + "task_id": "track_object_movement_00000002", + "generator": "track_object_movement", + "timestamp": "2026-02-17T07:35:25.709088", + "parameters": 
{ + "objects": [ + { + "x": 817, + "y": 401, + "size": 92, + "shape": "triangle", + "color": [ + 191, + 229, + 45 + ], + "is_target": true, + "is_tracked": false + }, + { + "x": 694, + "y": 636, + "size": 112, + "shape": "circle", + "color": [ + 145, + 229, + 45 + ], + "is_target": false, + "is_tracked": true + }, + { + "x": 484, + "y": 917, + "size": 88, + "shape": "octagon", + "color": [ + 40, + 30, + 153 + ], + "is_target": false, + "is_tracked": false + }, + { + "x": 344, + "y": 344, + "size": 116, + "shape": "rectangle", + "color": [ + 53, + 153, + 119 + ], + "is_target": false, + "is_tracked": false + }, + { + "x": 359, + "y": 666, + "size": 86, + "shape": "hexagon", + "color": [ + 153, + 95, + 76 + ], + "is_target": false, + "is_tracked": false + } + ], + "target_x": 817, + "target_y": 636 + }, + "param_hash": "5ce5037abbbdf369", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/prompt.txt b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..b881338d231d52395adeddf465775cd7e60e7ac0 --- /dev/null +++ b/VBVR-Dataset/track_object_movement_task/track_object_movement_00000002/prompt.txt @@ -0,0 +1 @@ +The object marked with a green border is the only object that moves. It moves horizontally to align directly below the object with a red star at its center. Track the movement with the green border as the object moves. 
\ No newline at end of file diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000000/final_frame.png b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c6e0ad284718330d442ca6d748f08507dcddeaf9 Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/final_frame.png differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000000/first_frame.png b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..71f9acff148fbfb63ee0ecc90d2b48ee6ac8f2c9 Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/first_frame.png differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000000/ground_truth.mp4 b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..7bf34c7fc4706ee2eb3cc99e7b29a628be6af3a0 Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/ground_truth.mp4 differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000000/metadata.json b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..cb0b455f2d88e171b4c97619509f98dbe7b61b2d --- /dev/null +++ b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/metadata.json @@ -0,0 +1,65 @@ +{ + "task_id": "traffic_light_00000000", + "generator": "traffic_light", + "timestamp": "2026-02-27T07:55:30.598178", + "parameters": { + "task_type": 1, + "time_elapsed": 4, + "num_active_lights": 4, + "active_directions": [ + "north", + "south", + "east", + "west" + ], + "enable_yellow_light": true, + "objects": [ + { + "symbol": "light_north", + "direction": "north", + "initial_state": "green", + "initial_countdown": 1, + "final_state": "yellow", + "final_countdown": 
1, + "is_active": true + }, + { + "symbol": "light_south", + "direction": "south", + "initial_state": "red", + "initial_countdown": 4, + "final_state": "yellow", + "final_countdown": 4, + "is_active": true + }, + { + "symbol": "light_east", + "direction": "east", + "initial_state": "green", + "initial_countdown": 4, + "final_state": "yellow", + "final_countdown": 4, + "is_active": true + }, + { + "symbol": "light_west", + "direction": "west", + "initial_state": "green", + "initial_countdown": 4, + "final_state": "yellow", + "final_countdown": 4, + "is_active": true + } + ] + }, + "param_hash": "0efeebdce634e723", + "generation": { + "seed": 2026, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000000/prompt.txt b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..2df89f1b88d771a4fe1dd41445cfd1596c86c416 --- /dev/null +++ b/VBVR-Dataset/traffic_light_task/traffic_light_00000000/prompt.txt @@ -0,0 +1 @@ +This scene shows a crossroad with four traffic lights (North, South, East, West). Each light independently follows a 3-color cycle: Red (4s) → Yellow (4s) → Green (4s) → Yellow (4s) → Red. Currently: North light is green with 1s countdown, South light is red with 4s countdown, East light is green with 4s countdown, West light is green with 4s countdown. Simulate 4 seconds and show the final state of all four traffic lights. 
\ No newline at end of file diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000001/final_frame.png b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ef7009ef23887bcb4c6940a2ab8ba9c3c69042a3 Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/final_frame.png differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000001/first_frame.png b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0acd939abca1b04d27d638132f628550ecde2b36 Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/first_frame.png differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000001/ground_truth.mp4 b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..cb396d83ced051846a9326ce49c22b9bfcf8328b Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/ground_truth.mp4 differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000001/metadata.json b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..1886e3b4698c4c426a296d4fdf9497b92dd425f9 --- /dev/null +++ b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/metadata.json @@ -0,0 +1,63 @@ +{ + "task_id": "traffic_light_00000001", + "generator": "traffic_light", + "timestamp": "2026-02-27T07:55:30.714957", + "parameters": { + "task_type": 1, + "time_elapsed": 3, + "num_active_lights": 2, + "active_directions": [ + "north", + "south" + ], + "enable_yellow_light": true, + "objects": [ + { + "symbol": "light_north", + "direction": "north", + "initial_state": "yellow", + "initial_countdown": 1, + "final_state": "red", + "final_countdown": 2, + "is_active": true 
+ }, + { + "symbol": "light_south", + "direction": "south", + "initial_state": "yellow", + "initial_countdown": 1, + "final_state": "red", + "final_countdown": 2, + "is_active": true + }, + { + "symbol": "light_east", + "direction": "east", + "initial_state": null, + "initial_countdown": 0, + "final_state": null, + "final_countdown": 0, + "is_active": false + }, + { + "symbol": "light_west", + "direction": "west", + "initial_state": null, + "initial_countdown": 0, + "final_state": null, + "final_countdown": 0, + "is_active": false + } + ] + }, + "param_hash": "f09289b466ca771e", + "generation": { + "seed": 2026, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000001/prompt.txt b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..9cc076b1233123fc32d189c4e05490abefbe1dfb --- /dev/null +++ b/VBVR-Dataset/traffic_light_task/traffic_light_00000001/prompt.txt @@ -0,0 +1 @@ +This scene shows a crossroad with two traffic lights (North, South). Each light independently follows a 3-color cycle: Red (4s) → Yellow (4s) → Green (4s) → Yellow (4s) → Red. Currently: North light is yellow with 1s countdown, South light is yellow with 1s countdown. Simulate 3 seconds and show the final state of both traffic lights. 
\ No newline at end of file diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000002/final_frame.png b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..9455f0956d6a98b8ffc468c6f4d5c9005cd1f46f Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/final_frame.png differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000002/first_frame.png b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..e316855ac5ed9d7cd6ad716bebed78eaa3153137 Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/first_frame.png differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000002/ground_truth.mp4 b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..923170c4e4e240ecce21f7ec5c69fd6c76b5815f Binary files /dev/null and b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/ground_truth.mp4 differ diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000002/metadata.json b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9ae890e2066da2d9cf173fbeb92a550b5adb7921 --- /dev/null +++ b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/metadata.json @@ -0,0 +1,64 @@ +{ + "task_id": "traffic_light_00000002", + "generator": "traffic_light", + "timestamp": "2026-02-27T07:55:30.842924", + "parameters": { + "task_type": 2, + "time_elapsed": 3, + "num_active_lights": 3, + "active_directions": [ + "south", + "west", + "east" + ], + "enable_yellow_light": true, + "objects": [ + { + "symbol": "light_north", + "direction": "north", + "initial_state": null, + "initial_countdown": 0, + "final_state": null, + "final_countdown": 0, + "is_active": 
false + }, + { + "symbol": "light_south", + "direction": "south", + "initial_state": "yellow", + "initial_countdown": 3, + "final_state": "red", + "final_countdown": 4, + "is_active": true + }, + { + "symbol": "light_east", + "direction": "east", + "initial_state": "yellow", + "initial_countdown": 1, + "final_state": "red", + "final_countdown": 2, + "is_active": true + }, + { + "symbol": "light_west", + "direction": "west", + "initial_state": "green", + "initial_countdown": 3, + "final_state": "yellow", + "final_countdown": 4, + "is_active": true + } + ] + }, + "param_hash": "662c1e17ef2ddcc3", + "generation": { + "seed": 2026, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/traffic_light_task/traffic_light_00000002/prompt.txt b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..57ef50cea74cfb327a2f36626e3f0704861b52fe --- /dev/null +++ b/VBVR-Dataset/traffic_light_task/traffic_light_00000002/prompt.txt @@ -0,0 +1 @@ +This scene shows a crossroad with three traffic lights (South, West, East). Each light independently follows a 3-color cycle: Red (4s) → Yellow (4s) → Green (4s) → Yellow (4s) → Red. Currently: South light is yellow with 3s countdown, West light is green with 3s countdown, East light is yellow with 1s countdown. Simulate 3 seconds and show the final state of all three traffic lights. 
\ No newline at end of file diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/final_frame.png b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..0d76f04d5c81849b7de4150d412d632dae7019d3 Binary files /dev/null and b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/final_frame.png differ diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/first_frame.png b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..90d3f008da39658354828ab4a5746bbc84060ad0 Binary files /dev/null and b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/first_frame.png differ diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/ground_truth.mp4 b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4d165fc93f756b9ad5a49d70f5c7070ac2c24a7d --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6fdedf82519c55ce174e5c47d06820c0b715fe754f6f9caa05f7a1475f2963f +size 280425 diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/metadata.json b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..59c36813019f22b48ced8c219dd0b9309c50d3e4 --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/metadata.json @@ -0,0 +1,57 @@ +{ + "task_id": 
"understand_scene_structure_00000000", + "generator": "understand_scene_structure", + "timestamp": "2026-02-17T07:27:39.268563", + "parameters": { + "rooms": [ + { + "rect": [ + 60, + 60, + 331.304908, + 536.689717 + ], + "type": "kitchen" + }, + { + "rect": [ + 331.304908, + 60, + 964, + 536.689717 + ], + "type": "living" + }, + { + "rect": [ + 60, + 536.689717, + 331.304908, + 964 + ], + "type": "bedroom" + }, + { + "rect": [ + 331.304908, + 536.689717, + 964, + 964 + ], + "type": "kitchen" + } + ], + "target_index": 2, + "target_type": "bedroom" + }, + "param_hash": "a7dcd7646c539f4a", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/prompt.txt b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4394e4d3a631f35622f09c191bb681c1d819692 --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a floorplan with multiple rooms. Identify the bedroom and draw a green rectangular box around it to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/final_frame.png b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8151b2f46a86d1de93636a6e0a881bca27f0c817 Binary files /dev/null and b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/final_frame.png differ diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/first_frame.png b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..95da8d7a7a66a0e9778b7af3c3c5640848a41fbd Binary files /dev/null and b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/first_frame.png differ diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/ground_truth.mp4 b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..75648760b0745ee9d9e6f70ffd2b4680f251f900 --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8098e743c8d26bd8b7b95f938bea241d85daf05c4896c8e4158e88d67f5a14bd +size 302191 diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/metadata.json b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..adba301df6d50784b22820331ea352af8ebfc84e --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/metadata.json @@ -0,0 +1,75 @@ +{ + "task_id": 
"understand_scene_structure_00000001", + "generator": "understand_scene_structure", + "timestamp": "2026-02-17T07:27:39.684116", + "parameters": { + "rooms": [ + { + "rect": [ + 60, + 60, + 566.440023, + 301.69882 + ], + "type": "bathroom" + }, + { + "rect": [ + 566.440023, + 60, + 964, + 301.69882 + ], + "type": "bathroom" + }, + { + "rect": [ + 60, + 301.69882, + 566.440023, + 633.168309 + ], + "type": "bathroom" + }, + { + "rect": [ + 566.440023, + 301.69882, + 964, + 633.168309 + ], + "type": "bathroom" + }, + { + "rect": [ + 60, + 633.168309, + 566.440023, + 964 + ], + "type": "storage" + }, + { + "rect": [ + 566.440023, + 633.168309, + 964, + 964 + ], + "type": "living" + } + ], + "target_index": 5, + "target_type": "living" + }, + "param_hash": "f8366d16781d0565", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/prompt.txt b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..27d6398a04126478215675ecbf1611f788bd37c5 --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a floorplan with multiple rooms. Identify the living room and draw a green rectangular box around it to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/final_frame.png b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..11b7223231b9ba7186a3e3512a66a9988970efc3 Binary files /dev/null and b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/final_frame.png differ diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/first_frame.png b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..8c881fd1c722f84cbdd4ae2fff36ac4b8f91a39c Binary files /dev/null and b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/first_frame.png differ diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/ground_truth.mp4 b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..127804f309716fc64bc7e7d332953d0aedfd9cc5 --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62fb073d09903831ccef10f84fb0a6a0aebb1030a5f759146660db2660ae7784 +size 280169 diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/metadata.json b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..98401166e171b340662f6c44a199cd9a4d24c6db --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/metadata.json @@ -0,0 +1,57 @@ +{ + "task_id": 
"understand_scene_structure_00000002", + "generator": "understand_scene_structure", + "timestamp": "2026-02-17T07:27:40.093826", + "parameters": { + "rooms": [ + { + "rect": [ + 60, + 60, + 605.093466, + 662.838152 + ], + "type": "kitchen" + }, + { + "rect": [ + 605.093466, + 60, + 964, + 662.838152 + ], + "type": "living" + }, + { + "rect": [ + 60, + 662.838152, + 605.093466, + 964 + ], + "type": "living" + }, + { + "rect": [ + 605.093466, + 662.838152, + 964, + 964 + ], + "type": "bedroom" + } + ], + "target_index": 3, + "target_type": "bedroom" + }, + "param_hash": "358e22ea9b7cc67f", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/prompt.txt b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..d4394e4d3a631f35622f09c191bb681c1d819692 --- /dev/null +++ b/VBVR-Dataset/understand_scene_structure_task/understand_scene_structure_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a floorplan with multiple rooms. Identify the bedroom and draw a green rectangular box around it to highlight it. 
\ No newline at end of file diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/final_frame.png b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..4fd933d81d4c9b91f75b499cff0e19de99c41da4 Binary files /dev/null and b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/final_frame.png differ diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/first_frame.png b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..3f82cdcfd241cd66870fd6f59decc6ef7692f386 Binary files /dev/null and b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/first_frame.png differ diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/ground_truth.mp4 b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..88b393dc5584723fda93924a2cf5d90ba1c58352 --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63126c3dbd905658d320a84cfe5890c95e0c2a556cdc896a4f1651e62cb410da +size 398937 diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/metadata.json b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..ffe5725f8643feb8f50efd38c938e93b6d2590db --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/metadata.json @@ -0,0 +1,69 @@ +{ + 
"task_id": "undirected_graph_navigation_00000000", + "generator": "undirected_graph_navigation", + "timestamp": "2026-02-17T07:21:34.354115", + "parameters": { + "nodes": { + "0": [ + 875, + 669 + ], + "1": [ + 218, + 195 + ], + "2": [ + 575, + 482 + ], + "3": [ + 293, + 523 + ], + "4": [ + 232, + 773 + ] + }, + "edges": { + "0": [ + 1 + ], + "1": [ + 0, + 2 + ], + "2": [ + 1, + 3 + ], + "3": [ + 2, + 4 + ], + "4": [ + 3 + ] + }, + "start_node": 0, + "end_node": 4, + "path": [ + 0, + 1, + 2, + 3, + 4 + ], + "num_nodes": 5 + }, + "param_hash": "2ab0f92aa5a8ddc8", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/prompt.txt b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a43835bf76e15a2903ebaaf9664fd5b741a7bcc --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows a network of nodes connected by undirected edges (edges without arrows) with a green starting node, a red ending node, and a purple triangular agent positioned at the green starting node. The agent can move along any edge, traversing it from one end to the other in either direction, moving from one node to an adjacent node each step. Move the purple triangular agent from the green starting node to the red ending node along the path with the minimum number of steps. 
\ No newline at end of file diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/final_frame.png b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..ae9c26d681cfc7ff2311106596d1adc43dfabac7 Binary files /dev/null and b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/final_frame.png differ diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/first_frame.png b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..c54d0355cbae9f82a06114626c239abeb321f158 Binary files /dev/null and b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/first_frame.png differ diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/ground_truth.mp4 b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..79232b1f051846a248eeba7c0f9a0d90d0791744 --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de0292d5963e14cfde22b12f187425027e0c8f95249af98831abfe433a32c9d +size 342116 diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/metadata.json b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..746ce8b5caf17ae055826a426ee981fa0104ffc1 --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/metadata.json @@ -0,0 +1,83 @@ +{ + 
"task_id": "undirected_graph_navigation_00000001", + "generator": "undirected_graph_navigation", + "timestamp": "2026-02-17T07:21:34.813237", + "parameters": { + "nodes": { + "0": [ + 398, + 741 + ], + "1": [ + 124, + 253 + ], + "2": [ + 783, + 717 + ], + "3": [ + 477, + 193 + ], + "4": [ + 763, + 268 + ], + "5": [ + 482, + 458 + ] + }, + "edges": { + "0": [ + 1, + 2, + 4 + ], + "1": [ + 0, + 2 + ], + "2": [ + 1, + 3, + 5, + 4, + 0 + ], + "3": [ + 2, + 4 + ], + "4": [ + 3, + 5, + 2, + 0 + ], + "5": [ + 4, + 2 + ] + }, + "start_node": 0, + "end_node": 5, + "path": [ + 0, + 2, + 5 + ], + "num_nodes": 6 + }, + "param_hash": "b8d6513698bab833", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/prompt.txt b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a43835bf76e15a2903ebaaf9664fd5b741a7bcc --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows a network of nodes connected by undirected edges (edges without arrows) with a green starting node, a red ending node, and a purple triangular agent positioned at the green starting node. The agent can move along any edge, traversing it from one end to the other in either direction, moving from one node to an adjacent node each step. Move the purple triangular agent from the green starting node to the red ending node along the path with the minimum number of steps. 
\ No newline at end of file diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/final_frame.png b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..772ab7fb1613f5fa4e325b11ccbaa9bcc41e9509 Binary files /dev/null and b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/final_frame.png differ diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/first_frame.png b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d3dcb0bc71409b7900081fa2358c403631ac6bd3 Binary files /dev/null and b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/first_frame.png differ diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/ground_truth.mp4 b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..4356b18662b6c7c65a0ef8fadf7a0a8a8a7e1178 --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32553dec67aaa1c6e9133f261076ec164a12543460f542b33b1c8650753463d8 +size 151657 diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/metadata.json b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..0dd19a2ff65f2de3091b1535e6589faa1e601913 --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/metadata.json @@ -0,0 +1,62 @@ +{ + 
"task_id": "undirected_graph_navigation_00000002", + "generator": "undirected_graph_navigation", + "timestamp": "2026-02-17T07:21:35.092555", + "parameters": { + "nodes": { + "0": [ + 618, + 341 + ], + "1": [ + 434, + 842 + ], + "2": [ + 342, + 514 + ], + "3": [ + 838, + 465 + ] + }, + "edges": { + "0": [ + 1, + 3 + ], + "1": [ + 0, + 2, + 3 + ], + "2": [ + 1, + 3 + ], + "3": [ + 2, + 1, + 0 + ] + }, + "start_node": 0, + "end_node": 3, + "path": [ + 0, + 3 + ], + "num_nodes": 4 + }, + "param_hash": "1a407dda07a734e4", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/prompt.txt b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a43835bf76e15a2903ebaaf9664fd5b741a7bcc --- /dev/null +++ b/VBVR-Dataset/undirected_graph_navigation_task/undirected_graph_navigation_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows a network of nodes connected by undirected edges (edges without arrows) with a green starting node, a red ending node, and a purple triangular agent positioned at the green starting node. The agent can move along any edge, traversing it from one end to the other in either direction, moving from one node to an adjacent node each step. Move the purple triangular agent from the green starting node to the red ending node along the path with the minimum number of steps. 
\ No newline at end of file diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/final_frame.png b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f1465a6f490af24829f179e3a15c91f76b3084f8 Binary files /dev/null and b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/final_frame.png differ diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/first_frame.png b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..a8c6a063acf499f4ef4fbd2e60727cddb94f5915 Binary files /dev/null and b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/first_frame.png differ diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/ground_truth.mp4 b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..3dac0fe45a42b5d0bc2397cf7735af60b11c0fb8 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634354f58cceba8f25ea972d1ee7d09378a573c4a5a9e65b32a57f509c3dbbad +size 170424 diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/metadata.json b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..d0d16f62990fb2d0e6b6d4984e79d870584a3b25 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/metadata.json @@ -0,0 +1,74 @@ +{ + "task_id": "visual_jenga_00000000", + "generator": "visual_jenga", + "timestamp": "2026-02-17T07:22:08.839770", + "parameters": { + "number": 3, + "blocks": [ + { + "width": 146, + "height": 146, + "color": [ + 249, + 238, + 187 + ], + "initial_position": [ + 512, + 366 + ], + "final_position": [ + 512, + 1170 + ], + "order": 1 + }, + { + "width": 146, + 
"height": 146, + "color": [ + 74, + 68, + 220 + ], + "initial_position": [ + 512, + 512 + ], + "final_position": [ + 1170, + 512 + ], + "order": 2 + }, + { + "width": 146, + "height": 146, + "color": [ + 192, + 215, + 134 + ], + "initial_position": [ + 512, + 658 + ], + "final_position": [ + 512, + -146 + ], + "order": 3 + } + ] + }, + "param_hash": "1d62daae407d3293", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/prompt.txt b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe4059f5f68e9d32e3333e50bb553bc41d5df619 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000000/prompt.txt @@ -0,0 +1 @@ +The scene shows objects stacked vertically. Extract the objects one by one from top to bottom in order, moving each object out of the frame before extracting the next one. Continue until all objects have been removed from the frame. 
\ No newline at end of file diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/final_frame.png b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f1465a6f490af24829f179e3a15c91f76b3084f8 Binary files /dev/null and b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/final_frame.png differ diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/first_frame.png b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..d5ab67545f45c1616c5fe67032ca32d76bffeeec Binary files /dev/null and b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/first_frame.png differ diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/ground_truth.mp4 b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..62c4835a38b6f037f9899ae87fbce83a02ad6119 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d856779a9ce10330e2456d3348c3732e312f47e904d4468c5ea2f6938a7c67 +size 290579 diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/metadata.json b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..a487b1987a33009a4a8f67e209d834e402464223 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/metadata.json @@ -0,0 +1,110 @@ +{ + "task_id": "visual_jenga_00000001", + "generator": "visual_jenga", + "timestamp": "2026-02-17T07:22:09.808156", + "parameters": { + "number": 5, + "blocks": [ + { + "width": 258, + "height": 146, + "color": [ + 210, + 178, + 207 + ], + "initial_position": [ + 512, + 220 + ], + "final_position": [ + 512, + -258 + ], + "order": 1 + }, + { + "width": 146, + 
"height": 146, + "color": [ + 85, + 130, + 119 + ], + "initial_position": [ + 512, + 366 + ], + "final_position": [ + 512, + 1170 + ], + "order": 2 + }, + { + "width": 146, + "height": 146, + "color": [ + 205, + 51, + 83 + ], + "initial_position": [ + 512, + 512 + ], + "final_position": [ + 1170, + 512 + ], + "order": 3 + }, + { + "width": 146, + "height": 146, + "color": [ + 56, + 76, + 159 + ], + "initial_position": [ + 512, + 658 + ], + "final_position": [ + -146, + 512 + ], + "order": 4 + }, + { + "width": 272, + "height": 146, + "color": [ + 217, + 88, + 62 + ], + "initial_position": [ + 512, + 804 + ], + "final_position": [ + 512, + -272 + ], + "order": 5 + } + ] + }, + "param_hash": "227488fd1f308519", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/prompt.txt b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe4059f5f68e9d32e3333e50bb553bc41d5df619 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000001/prompt.txt @@ -0,0 +1 @@ +The scene shows objects stacked vertically. Extract the objects one by one from top to bottom in order, moving each object out of the frame before extracting the next one. Continue until all objects have been removed from the frame. 
\ No newline at end of file diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/final_frame.png b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/final_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..f1465a6f490af24829f179e3a15c91f76b3084f8 Binary files /dev/null and b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/final_frame.png differ diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/first_frame.png b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/first_frame.png new file mode 100644 index 0000000000000000000000000000000000000000..81e8e3d60c22d23035dee6a97b154b29231ecab0 Binary files /dev/null and b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/first_frame.png differ diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/ground_truth.mp4 b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/ground_truth.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..e195687800c570d18f38cc108e3aec9bf100235e --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/ground_truth.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accf56c02ef1eac1ee00af34779a0a2e8abef88f17d71ee7c2669156d2738a40 +size 226065 diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/metadata.json b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..388d8c05d2dcee661a5ef3d4ba578a2e2a15aa89 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/metadata.json @@ -0,0 +1,92 @@ +{ + "task_id": "visual_jenga_00000002", + "generator": "visual_jenga", + "timestamp": "2026-02-17T07:22:10.661893", + "parameters": { + "number": 4, + "blocks": [ + { + "width": 146, + "height": 146, + "color": [ + 134, + 184, + 143 + ], + "initial_position": [ + 512, + 293 + ], + "final_position": [ + 512, + -146 + ], + "order": 1 + }, + { + "width": 146, + 
"height": 146, + "color": [ + 157, + 233, + 231 + ], + "initial_position": [ + 512, + 439 + ], + "final_position": [ + 512, + -146 + ], + "order": 2 + }, + { + "width": 146, + "height": 146, + "color": [ + 145, + 225, + 162 + ], + "initial_position": [ + 512, + 585 + ], + "final_position": [ + 512, + -146 + ], + "order": 3 + }, + { + "width": 146, + "height": 146, + "color": [ + 198, + 207, + 217 + ], + "initial_position": [ + 512, + 731 + ], + "final_position": [ + 512, + -146 + ], + "order": 4 + } + ] + }, + "param_hash": "e32c159e34b536ab", + "generation": { + "seed": 1965760370, + "git": { + "commit": "", + "branch": "", + "repo": "", + "is_dirty": false + } + } +} \ No newline at end of file diff --git a/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/prompt.txt b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/prompt.txt new file mode 100644 index 0000000000000000000000000000000000000000..fe4059f5f68e9d32e3333e50bb553bc41d5df619 --- /dev/null +++ b/VBVR-Dataset/visual_jenga_task/visual_jenga_00000002/prompt.txt @@ -0,0 +1 @@ +The scene shows objects stacked vertically. Extract the objects one by one from top to bottom in order, moving each object out of the frame before extracting the next one. Continue until all objects have been removed from the frame. \ No newline at end of file