NV-MedTech
Safetensors
Gr00tN1d6
GR00T-H / processor_config.json
nigeln's picture
Squash history into single release commit
47d8583
{
"processor_class": "Gr00tN1d6Processor",
"processor_kwargs": {
"modality_configs": {
"behavior_r1_pro": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"observation.images.rgb.head_256_256",
"observation.images.rgb.left_wrist_256_256",
"observation.images.rgb.right_wrist_256_256"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"robot_pos",
"robot_ori_cos",
"robot_ori_sin",
"robot_2d_ori",
"robot_2d_ori_cos",
"robot_2d_ori_sin",
"robot_lin_vel",
"robot_ang_vel",
"arm_left_qpos",
"arm_left_qpos_sin",
"arm_left_qpos_cos",
"eef_left_pos",
"eef_left_quat",
"gripper_left_qpos",
"arm_right_qpos",
"arm_right_qpos_sin",
"arm_right_qpos_cos",
"eef_right_pos",
"eef_right_quat",
"gripper_right_qpos",
"trunk_qpos"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31
],
"modality_keys": [
"base",
"torso",
"left_arm",
"left_gripper",
"right_arm",
"right_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": "trunk_qpos",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": "arm_left_qpos",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": "arm_right_qpos",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.human.coarse_action"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"gr1": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"ego_view_bg_crop_pad_res256_freq20"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"left_arm",
"right_arm",
"left_hand",
"right_hand",
"waist"
],
"sin_cos_embedding_keys": [
"left_arm",
"right_arm",
"left_hand",
"right_hand",
"waist"
],
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15
],
"modality_keys": [
"left_arm",
"right_arm",
"left_hand",
"right_hand",
"waist"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "RELATIVE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"robocasa_panda_omron": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"res256_image_side_0",
"res256_image_side_1",
"res256_image_wrist_0"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"end_effector_position_relative",
"end_effector_rotation_relative",
"gripper_qpos",
"base_position",
"base_rotation"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15
],
"modality_keys": [
"end_effector_position",
"end_effector_rotation",
"gripper_close",
"base_motion",
"control_mode"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.human.action.task_description"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"cmr_versius": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"left_pose",
"left_gripper",
"right_pose",
"right_gripper",
"translation_scaling",
"rotation_scaling",
"hapticengaged_left",
"hapticengaged_right"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"left_pose",
"left_gripper",
"right_pose",
"right_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": [
"translation_scaling",
"rotation_scaling",
"hapticengaged_left",
"hapticengaged_right"
],
"action_configs": null
},
"action": {
"delta_indices": [
2,
4,
6,
8,
10,
12,
14,
16,
18,
20,
22,
24,
26,
28,
30,
32,
34,
36,
38,
40,
42,
44,
46,
48,
50,
52,
54,
56,
58,
60,
62,
64,
66,
68,
70,
72,
74,
76,
78,
80,
82,
84,
86,
88,
90,
92,
94,
96,
98,
100
],
"modality_keys": [
"left_pose",
"left_gripper",
"right_pose",
"right_gripper",
"hapticengaged_left",
"hapticengaged_right"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": [
"hapticengaged_left",
"hapticengaged_right"
],
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "left_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": "translation_scaling",
"rotation_scaling_key": "rotation_scaling",
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": "left_gripper",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": true
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "right_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": "translation_scaling",
"rotation_scaling_key": "rotation_scaling",
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": "right_gripper",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": true
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "skip",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "skip",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.human.task_description"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"ucsd_dvrk": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"camera_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm_retraction_pose",
"psm_retraction_gripper",
"psm_cutter_pose",
"psm_cutter_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm_retraction_pose",
"psm_retraction_gripper",
"psm_cutter_pose",
"psm_cutter_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49,
50
],
"modality_keys": [
"psm_retraction_pose",
"psm_retraction_gripper",
"psm_cutter_pose",
"psm_cutter_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm_retraction_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "wxyz",
"reference_rotation_format": "quat",
"reference_quat_order": "wxyz",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm_cutter_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "wxyz",
"reference_rotation_format": "quat",
"reference_quat_order": "wxyz",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"jhu_imerse_dvrk": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left",
"wrist_left",
"wrist_right"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49,
50
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.human.task_description"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"obuda_dvrk": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left",
"wrist_left",
"wrist_right"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"stanford_dvrk_real": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "euler",
"input_quat_order": "xyzw",
"reference_rotation_format": "euler",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "euler",
"input_quat_order": "xyzw",
"reference_rotation_format": "euler",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"tud_tundra_ur5e": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"laparoscope_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"joint_position",
"eef_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"joint_position"
],
"min_max_embedding_keys": null,
"pass_through_keys": [
"eef_pose"
],
"action_configs": null
},
"action": {
"delta_indices": [
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49,
50
],
"modality_keys": [
"eef_pose",
"gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "eef_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"jhu_lscr_dvrk_smarts": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left",
"camera_side_view"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"jhu_imerse_dvrk_mono": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.human.task_description"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"rob_surgical_bitrack": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"left_pose",
"right_pose",
"aux_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"left_pose",
"right_pose",
"aux_pose"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"left_pose",
"right_pose",
"aux_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "left_pose",
"normalization_type": "percentile",
"input_rotation_format": "euler",
"input_quat_order": "xyzw",
"reference_rotation_format": "euler",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "right_pose",
"normalization_type": "percentile",
"input_rotation_format": "euler",
"input_quat_order": "xyzw",
"reference_rotation_format": "euler",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "aux_pose",
"normalization_type": "percentile",
"input_rotation_format": "euler",
"input_quat_order": "xyzw",
"reference_rotation_format": "euler",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.instruction"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"turin_mitic_ex_vivo": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_joints",
"psm2_joints",
"psm1_pose",
"psm2_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_joints",
"psm2_joints"
],
"min_max_embedding_keys": null,
"pass_through_keys": [
"psm1_pose",
"psm2_pose"
],
"action_configs": null
},
"action": {
"delta_indices": [
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49,
50
],
"modality_keys": [
"psm1_pose",
"psm2_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.instruction"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"ustc_torin_tuodao": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"left_joints",
"right_joints",
"left_pose",
"right_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"left_joints",
"right_joints"
],
"min_max_embedding_keys": null,
"pass_through_keys": [
"left_pose",
"right_pose"
],
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"left_pose",
"left_gripper",
"right_pose",
"right_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "left_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "right_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.instruction"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"hamlyn_dvrk_30hz": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope",
"wrist_left",
"wrist_right"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"left_arm_pose",
"left_arm_gripper",
"right_arm_pose",
"right_arm_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"left_arm_pose",
"left_arm_gripper",
"right_arm_pose",
"right_arm_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"left_arm_pose",
"left_arm_gripper",
"right_arm_pose",
"right_arm_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "left_arm_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "wxyz",
"reference_rotation_format": "quat",
"reference_quat_order": "wxyz",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "right_arm_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "wxyz",
"reference_rotation_format": "quat",
"reference_quat_order": "wxyz",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"ucb_dvrk": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"camera_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"psm1_joints",
"psm1_gripper",
"psm2_joints",
"psm2_gripper",
"psm1_pose",
"psm2_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"psm1_joints",
"psm1_gripper",
"psm2_joints",
"psm2_gripper"
],
"min_max_embedding_keys": null,
"pass_through_keys": [
"psm1_pose",
"psm2_pose"
],
"action_configs": null
},
"action": {
"delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49
],
"modality_keys": [
"psm1_pose",
"psm1_gripper",
"psm2_pose",
"psm2_gripper"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm1_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "psm2_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
},
{
"rep": "ABSOLUTE",
"type": "NON_EEF",
"format": "DEFAULT",
"state_key": null,
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "rot6d",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"task"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
},
"jhu_imerse_star_il": {
"video": {
"delta_indices": [
0
],
"modality_keys": [
"endoscope_left",
"wrist_left"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
},
"state": {
"delta_indices": [
0
],
"modality_keys": [
"kuka_joint_pos",
"endo360_joint_pos",
"kuka_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": [
"kuka_joint_pos",
"endo360_joint_pos"
],
"min_max_embedding_keys": null,
"pass_through_keys": [
"kuka_pose"
],
"action_configs": null
},
"action": {
"delta_indices": [
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49,
50
],
"modality_keys": [
"kuka_pose"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": [
{
"rep": "REL_XYZ_ROT6D",
"type": "EEF",
"format": "XYZ_ROT6D",
"state_key": "kuka_pose",
"normalization_type": "percentile",
"input_rotation_format": "quat",
"input_quat_order": "xyzw",
"reference_rotation_format": "quat",
"reference_quat_order": "xyzw",
"translation_scaling_key": null,
"rotation_scaling_key": null,
"hold_through_clutch": false
}
]
},
"language": {
"delta_indices": [
0
],
"modality_keys": [
"annotation.human.task_description"
],
"sin_cos_embedding_keys": null,
"mean_std_embedding_keys": null,
"min_max_embedding_keys": null,
"pass_through_keys": null,
"action_configs": null
}
}
},
"image_crop_size": [
224,
392
],
"image_target_size": [
236,
414
],
"use_albumentations": false,
"random_rotation_angle": 5,
"color_jitter_params": {
"brightness": 0.12,
"contrast": 0.15,
"saturation": 0.15,
"hue": 0.02
},
"shortest_image_edge": null,
"crop_fraction": null,
"model_name": "nvidia/Eagle-Block2A-2B-v2",
"model_type": "eagle",
"formalize_language": true,
"max_state_dim": 128,
"max_action_dim": 128,
"max_action_horizon": 50,
"use_percentiles": false,
"clip_outliers": true,
"apply_sincos_state_encoding": true,
"use_relative_action": true
}
}