| { |
| "processor_class": "Gr00tN1d6Processor", |
| "processor_kwargs": { |
| "modality_configs": { |
| "behavior_r1_pro": { |
| "video": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "observation.images.rgb.head_256_256", |
| "observation.images.rgb.left_wrist_256_256", |
| "observation.images.rgb.right_wrist_256_256" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "state": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "robot_pos", |
| "robot_ori_cos", |
| "robot_ori_sin", |
| "robot_2d_ori", |
| "robot_2d_ori_cos", |
| "robot_2d_ori_sin", |
| "robot_lin_vel", |
| "robot_ang_vel", |
| "arm_left_qpos", |
| "arm_left_qpos_sin", |
| "arm_left_qpos_cos", |
| "eef_left_pos", |
| "eef_left_quat", |
| "gripper_left_qpos", |
| "arm_right_qpos", |
| "arm_right_qpos_sin", |
| "arm_right_qpos_cos", |
| "eef_right_pos", |
| "eef_right_quat", |
| "gripper_right_qpos", |
| "trunk_qpos" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "action": { |
| "delta_indices": [ |
| 0, |
| 1, |
| 2, |
| 3, |
| 4, |
| 5, |
| 6, |
| 7, |
| 8, |
| 9, |
| 10, |
| 11, |
| 12, |
| 13, |
| 14, |
| 15, |
| 16, |
| 17, |
| 18, |
| 19, |
| 20, |
| 21, |
| 22, |
| 23, |
| 24, |
| 25, |
| 26, |
| 27, |
| 28, |
| 29, |
| 30, |
| 31 |
| ], |
| "modality_keys": [ |
| "base", |
| "torso", |
| "left_arm", |
| "left_gripper", |
| "right_arm", |
| "right_gripper" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": [ |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": "trunk_qpos" |
| }, |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": "arm_left_qpos" |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": "arm_right_qpos" |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| } |
| ] |
| }, |
| "language": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "annotation.human.coarse_action" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| } |
| }, |
| "gr1": { |
| "video": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "ego_view_bg_crop_pad_res256_freq20" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "state": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "left_arm", |
| "right_arm", |
| "left_hand", |
| "right_hand", |
| "waist" |
| ], |
| "sin_cos_embedding_keys": [ |
| "left_arm", |
| "right_arm", |
| "left_hand", |
| "right_hand", |
| "waist" |
| ], |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "action": { |
| "delta_indices": [ |
| 0, |
| 1, |
| 2, |
| 3, |
| 4, |
| 5, |
| 6, |
| 7, |
| 8, |
| 9, |
| 10, |
| 11, |
| 12, |
| 13, |
| 14, |
| 15 |
| ], |
| "modality_keys": [ |
| "left_arm", |
| "right_arm", |
| "left_hand", |
| "right_hand", |
| "waist" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": [ |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "RELATIVE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| } |
| ] |
| }, |
| "language": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "task" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| } |
| }, |
| "robocasa_panda_omron": { |
| "video": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "res256_image_side_0", |
| "res256_image_side_1", |
| "res256_image_wrist_0" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "state": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "end_effector_position_relative", |
| "end_effector_rotation_relative", |
| "gripper_qpos", |
| "base_position", |
| "base_rotation" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "action": { |
| "delta_indices": [ |
| 0, |
| 1, |
| 2, |
| 3, |
| 4, |
| 5, |
| 6, |
| 7, |
| 8, |
| 9, |
| 10, |
| 11, |
| 12, |
| 13, |
| 14, |
| 15 |
| ], |
| "modality_keys": [ |
| "end_effector_position", |
| "end_effector_rotation", |
| "gripper_close", |
| "base_motion", |
| "control_mode" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": [ |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| } |
| ] |
| }, |
| "language": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "annotation.human.action.task_description" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| } |
| }, |
| "new_embodiment": { |
| "video": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "cam_left_head" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "state": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "arm_left", |
| "arm_right" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| }, |
| "action": { |
| "delta_indices": [ |
| 0, |
| 1, |
| 2, |
| 3, |
| 4, |
| 5, |
| 6, |
| 7, |
| 8, |
| 9, |
| 10, |
| 11, |
| 12, |
| 13, |
| 14, |
| 15 |
| ], |
| "modality_keys": [ |
| "arm_left", |
| "arm_right" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": [ |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| }, |
| { |
| "rep": "ABSOLUTE", |
| "type": "NON_EEF", |
| "format": "DEFAULT", |
| "state_key": null |
| } |
| ] |
| }, |
| "language": { |
| "delta_indices": [ |
| 0 |
| ], |
| "modality_keys": [ |
| "annotation.human.task_description" |
| ], |
| "sin_cos_embedding_keys": null, |
| "mean_std_embedding_keys": null, |
| "action_configs": null |
| } |
| } |
| }, |
| "image_crop_size": null, |
| "image_target_size": null, |
| "use_albumentations": true, |
| "random_rotation_angle": null, |
| "color_jitter_params": { |
| "brightness": 0.3, |
| "contrast": 0.4, |
| "saturation": 0.5, |
| "hue": 0.08 |
| }, |
| "shortest_image_edge": 256, |
| "crop_fraction": 0.95, |
| "model_name": "nvidia/Eagle-Block2A-2B-v2", |
| "model_type": "eagle", |
| "formalize_language": true, |
| "max_state_dim": 128, |
| "max_action_dim": 128, |
| "max_action_horizon": 50, |
| "use_percentiles": false, |
| "clip_outliers": true, |
| "apply_sincos_state_encoding": true, |
| "use_relative_action": true |
| } |
| } |