| { | |
| "processor_class": "Gr00tN1d6Processor", | |
| "processor_kwargs": { | |
| "modality_configs": { | |
| "behavior_r1_pro": { | |
| "video": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "observation.images.rgb.head_256_256", | |
| "observation.images.rgb.left_wrist_256_256", | |
| "observation.images.rgb.right_wrist_256_256" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "robot_pos", | |
| "robot_ori_cos", | |
| "robot_ori_sin", | |
| "robot_2d_ori", | |
| "robot_2d_ori_cos", | |
| "robot_2d_ori_sin", | |
| "robot_lin_vel", | |
| "robot_ang_vel", | |
| "arm_left_qpos", | |
| "arm_left_qpos_sin", | |
| "arm_left_qpos_cos", | |
| "eef_left_pos", | |
| "eef_left_quat", | |
| "gripper_left_qpos", | |
| "arm_right_qpos", | |
| "arm_right_qpos_sin", | |
| "arm_right_qpos_cos", | |
| "eef_right_pos", | |
| "eef_right_quat", | |
| "gripper_right_qpos", | |
| "trunk_qpos" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15, | |
| 16, | |
| 17, | |
| 18, | |
| 19, | |
| 20, | |
| 21, | |
| 22, | |
| 23, | |
| 24, | |
| 25, | |
| 26, | |
| 27, | |
| 28, | |
| 29, | |
| 30, | |
| 31 | |
| ], | |
| "modality_keys": [ | |
| "base", | |
| "torso", | |
| "left_arm", | |
| "left_gripper", | |
| "right_arm", | |
| "right_gripper" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": "trunk_qpos" | |
| }, | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": "arm_left_qpos" | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": "arm_right_qpos" | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.coarse_action" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "gr1": { | |
| "video": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "ego_view_bg_crop_pad_res256_freq20" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "right_arm", | |
| "left_hand", | |
| "right_hand", | |
| "waist" | |
| ], | |
| "sin_cos_embedding_keys": [ | |
| "left_arm", | |
| "right_arm", | |
| "left_hand", | |
| "right_hand", | |
| "waist" | |
| ], | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "right_arm", | |
| "left_hand", | |
| "right_hand", | |
| "waist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "RELATIVE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "task" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "rl_info": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "robocasa_panda_omron": { | |
| "video": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "res256_image_side_0", | |
| "res256_image_side_1", | |
| "res256_image_wrist_0" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position_relative", | |
| "end_effector_rotation_relative", | |
| "gripper_qpos", | |
| "base_position", | |
| "base_rotation" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close", | |
| "base_motion", | |
| "control_mode" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| } | |
| }, | |
| "image_crop_size": null, | |
| "image_target_size": null, | |
| "use_albumentations": true, | |
| "random_rotation_angle": null, | |
| "color_jitter_params": { | |
| "brightness": 0.3, | |
| "contrast": 0.4, | |
| "saturation": 0.5, | |
| "hue": 0.08 | |
| }, | |
| "shortest_image_edge": 256, | |
| "crop_fraction": 0.95, | |
| "model_name": "nvidia/Eagle-Block2A-2B-v2", | |
| "model_type": "eagle", | |
| "formalize_language": true, | |
| "max_state_dim": 128, | |
| "max_action_dim": 128, | |
| "max_action_horizon": 50, | |
| "use_percentiles": false, | |
| "clip_outliers": true, | |
| "apply_sincos_state_encoding": true, | |
| "use_relative_action": true | |
| } | |
| } |