| { | |
| "dataset_kwargs": { | |
| "balance_weights": false, | |
| "batch_size": 8, | |
| "dataset_kwargs_list": [ | |
| { | |
| "name": "kuka", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "kuka_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "taco_play", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "rgb_static", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "taco_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "taco_extra", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "rgb_static", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "taco_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "jaco_play", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "jaco_play_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "berkeley_cable_routing", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "berkeley_cable_routing_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "roboturk", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "front_rgb", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "roboturk_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "viola", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "agentview_rgb", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "viola_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "berkeley_autolab_ur5", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "berkeley_autolab_ur5_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "toto", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "toto_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "language_table", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "rgb", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "language_table_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "stanford_hydra_dataset_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "stanford_hydra_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "austin_buds_dataset_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "austin_buds_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "nyu_franka_play_dataset_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "nyu_franka_play_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "furniture_bench_dataset_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "furniture_bench_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "austin_sailor_dataset_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "nav": null, | |
| "high": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "austin_sailor_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "austin_sirius_dataset_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "nav": null, | |
| "high": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "austin_sirius_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "bc_z", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "bc_z_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "dlr_edan_shared_control_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "dlr_edan_shared_control_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "iamlab_cmu_pickup_insert_converted_externally_to_rlds", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "iamlab_pick_insert_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "utaustin_mutex", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "utaustin_mutex_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "berkeley_fanuc_manipulation", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "berkeley_fanuc_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "cmu_stretch", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "cmu_stretch_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "droid", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "exterior_image_1_left", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "filter_functions": [ | |
| { | |
| "module": "experiments.homer.scripts.configs.cross_embodiment", | |
| "name": "filter_success", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| ], | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "droid_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_pen_uncap_diverse_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_pen_uncap_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_dough_cut_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_dough_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_lucy_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_dough_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_drawer_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_dough_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_pick_place_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_dough_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_static_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_dough_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "aloha_sushi_cut_full_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": "cam_high", | |
| "nav": null, | |
| "left_wrist": "cam_left_wrist", | |
| "right_wrist": "cam_right_wrist" | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": "proprio", | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "aloha_dough_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "bridge_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image_0", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "bridge_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "go1", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": "proprio" | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "go1_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "droid_wipe", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "exterior_image_2_left", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "droid_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "omnimimic_gnm_dataset", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": null, | |
| "high": null, | |
| "nav": "image", | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "omnimimic_gnm_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| }, | |
| { | |
| "name": "fractal20220817_data", | |
| "data_dir": null, | |
| "image_obs_keys": { | |
| "primary": "image", | |
| "high": null, | |
| "nav": null, | |
| "left_wrist": null, | |
| "right_wrist": null | |
| }, | |
| "proprio_obs_keys": { | |
| "bimanual": null, | |
| "quadruped": null | |
| }, | |
| "proprio_obs_dims": { | |
| "bimanual": 14, | |
| "quadruped": 59 | |
| }, | |
| "action_normalization_mask": [ | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| true, | |
| false | |
| ], | |
| "language_key": "language_instruction", | |
| "action_proprio_normalization_type": "normal", | |
| "standardize_fn": { | |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", | |
| "name": "rt1_dataset_transform", | |
| "args": [], | |
| "kwargs": {} | |
| } | |
| } | |
| ], | |
| "frame_transform_kwargs": { | |
| "image_augment_kwargs": { | |
| "high": { | |
| "augment_order": [ | |
| "random_resized_crop", | |
| "random_brightness", | |
| "random_contrast", | |
| "random_saturation", | |
| "random_hue" | |
| ], | |
| "random_brightness": [ | |
| 0.1 | |
| ], | |
| "random_contrast": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "random_hue": [ | |
| 0.05 | |
| ], | |
| "random_resized_crop": { | |
| "ratio": [ | |
| 0.75, | |
| 1.3333333333333333 | |
| ], | |
| "scale": [ | |
| 0.9, | |
| 1.0 | |
| ] | |
| }, | |
| "random_saturation": [ | |
| 0.9, | |
| 1.1 | |
| ] | |
| }, | |
| "left_wrist": { | |
| "augment_order": [ | |
| "random_resized_crop", | |
| "random_brightness", | |
| "random_contrast", | |
| "random_saturation", | |
| "random_hue" | |
| ], | |
| "random_brightness": [ | |
| 0.1 | |
| ], | |
| "random_contrast": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "random_hue": [ | |
| 0.05 | |
| ], | |
| "random_resized_crop": { | |
| "ratio": [ | |
| 0.75, | |
| 1.3333333333333333 | |
| ], | |
| "scale": [ | |
| 0.9, | |
| 1.0 | |
| ] | |
| }, | |
| "random_saturation": [ | |
| 0.9, | |
| 1.1 | |
| ] | |
| }, | |
| "nav": { | |
| "augment_order": [ | |
| "random_resized_crop", | |
| "random_brightness", | |
| "random_contrast", | |
| "random_saturation", | |
| "random_hue" | |
| ], | |
| "random_brightness": [ | |
| 0.1 | |
| ], | |
| "random_contrast": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "random_hue": [ | |
| 0.05 | |
| ], | |
| "random_resized_crop": { | |
| "ratio": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "scale": [ | |
| 0.8, | |
| 1.0 | |
| ] | |
| }, | |
| "random_saturation": [ | |
| 0.9, | |
| 1.1 | |
| ] | |
| }, | |
| "primary": { | |
| "augment_order": [ | |
| "random_resized_crop", | |
| "random_brightness", | |
| "random_contrast", | |
| "random_saturation", | |
| "random_hue" | |
| ], | |
| "random_brightness": [ | |
| 0.1 | |
| ], | |
| "random_contrast": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "random_hue": [ | |
| 0.05 | |
| ], | |
| "random_resized_crop": { | |
| "ratio": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "scale": [ | |
| 0.8, | |
| 1.0 | |
| ] | |
| }, | |
| "random_saturation": [ | |
| 0.9, | |
| 1.1 | |
| ] | |
| }, | |
| "right_wrist": { | |
| "augment_order": [ | |
| "random_resized_crop", | |
| "random_brightness", | |
| "random_contrast", | |
| "random_saturation", | |
| "random_hue" | |
| ], | |
| "random_brightness": [ | |
| 0.1 | |
| ], | |
| "random_contrast": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "random_hue": [ | |
| 0.05 | |
| ], | |
| "random_resized_crop": { | |
| "ratio": [ | |
| 0.75, | |
| 1.3333333333333333 | |
| ], | |
| "scale": [ | |
| 0.9, | |
| 1.0 | |
| ] | |
| }, | |
| "random_saturation": [ | |
| 0.9, | |
| 1.1 | |
| ] | |
| } | |
| }, | |
| "num_parallel_calls": 200, | |
| "resize_size": { | |
| "high": [ | |
| 224, | |
| 224 | |
| ], | |
| "left_wrist": [ | |
| 224, | |
| 224 | |
| ], | |
| "nav": [ | |
| 224, | |
| 224 | |
| ], | |
| "primary": [ | |
| 224, | |
| 224 | |
| ], | |
| "right_wrist": [ | |
| 224, | |
| 224 | |
| ] | |
| } | |
| }, | |
| "sample_weights": [ | |
| 0.021755552811740044, | |
| 0.009986998241552502, | |
| 0.0023179438302583103, | |
| 0.0016371801232614254, | |
| 0.0008888419195460733, | |
| 0.007874885740329124, | |
| 0.0032054418194781, | |
| 0.004113224757060238, | |
| 0.006839324427193265, | |
| 0.01479473259297815, | |
| 0.015045048015813084, | |
| 0.0007163148639093663, | |
| 0.002826978440249719, | |
| 0.008290489894059044, | |
| 0.007414589603576858, | |
| 0.005878414243900214, | |
| 0.021755552811740044, | |
| 0.0001874782805166165, | |
| 0.0030709017944702635, | |
| 0.007599149035416076, | |
| 0.0026296096724881066, | |
| 0.0005253087662862543, | |
| 0.0002175555281174004, | |
| 0.085, | |
| 0.014166666666666666, | |
| 0.014166666666666666, | |
| 0.014166666666666666, | |
| 0.014166666666666666, | |
| 0.014166666666666666, | |
| 0.014166666666666666, | |
| 0.17, | |
| 0.085, | |
| 0.085, | |
| 0.17, | |
| 0.17 | |
| ], | |
| "shuffle_buffer_size": 25000, | |
| "traj_read_threads": 48, | |
| "traj_transform_kwargs": { | |
| "action_horizon": 100, | |
| "goal_relabeling_kwargs": { | |
| "max_goal_distance": 15 | |
| }, | |
| "goal_relabeling_strategy": "uniform", | |
| "head_to_dataset": { | |
| "bimanual": [ | |
| "aloha_pen_uncap_diverse_dataset", | |
| "aloha_dough_cut_dataset", | |
| "aloha_lucy_dataset", | |
| "aloha_drawer_dataset", | |
| "aloha_pick_place_dataset", | |
| "aloha_static_dataset", | |
| "aloha_sushi_cut_full_dataset" | |
| ], | |
| "nav": [ | |
| "omnimimic_gnm_dataset" | |
| ], | |
| "quadruped": [ | |
| "go1" | |
| ], | |
| "single_arm": [ | |
| "bridge_dataset", | |
| "fractal20220817_data", | |
| "kuka", | |
| "taco_play", | |
| "taco_extra", | |
| "jaco_play", | |
| "berkeley_cable_routing", | |
| "roboturk", | |
| "nyu_door_opening_surprising_effectiveness", | |
| "viola", | |
| "berkeley_autolab_ur5", | |
| "toto", | |
| "language_table", | |
| "stanford_hydra_dataset_converted_externally_to_rlds", | |
| "austin_buds_dataset_converted_externally_to_rlds", | |
| "nyu_franka_play_dataset_converted_externally_to_rlds", | |
| "furniture_bench_dataset_converted_externally_to_rlds", | |
| "austin_sailor_dataset_converted_externally_to_rlds", | |
| "austin_sirius_dataset_converted_externally_to_rlds", | |
| "bc_z", | |
| "dlr_edan_shared_control_converted_externally_to_rlds", | |
| "iamlab_cmu_pickup_insert_converted_externally_to_rlds", | |
| "utaustin_mutex", | |
| "berkeley_fanuc_manipulation", | |
| "cmu_stretch", | |
| "droid", | |
| "droid_wipe" | |
| ] | |
| }, | |
| "max_action_dim": 14, | |
| "subsample_length": 100, | |
| "task_augment_kwargs": { | |
| "keep_image_prob": 1.0 | |
| }, | |
| "task_augment_strategy": "delete_task_conditioning", | |
| "window_size": 5 | |
| }, | |
| "traj_transform_threads": 48 | |
| }, | |
| "eval_datasets": [], | |
| "eval_interval": 5e+20, | |
| "log_interval": 500, | |
| "model": { | |
| "heads": { | |
| "bimanual": { | |
| "args": [], | |
| "kwargs": { | |
| "action_dim": 14, | |
| "action_horizon": 100, | |
| "clip_pred": false, | |
| "constrain_loss_dims": true, | |
| "loss_weight": 1.0, | |
| "num_preds": 14, | |
| "pool_strategy": "pass", | |
| "readout_key": "readout_bimanual" | |
| }, | |
| "module": "crossformer.model.components.action_heads", | |
| "name": "L1ActionHead" | |
| }, | |
| "nav": { | |
| "args": [], | |
| "kwargs": { | |
| "action_dim": 2, | |
| "action_horizon": 4, | |
| "clip_pred": false, | |
| "constrain_loss_dims": true, | |
| "loss_weight": 1.0, | |
| "num_preds": 2, | |
| "pool_strategy": "pass", | |
| "readout_key": "readout_nav" | |
| }, | |
| "module": "crossformer.model.components.action_heads", | |
| "name": "L1ActionHead" | |
| }, | |
| "quadruped": { | |
| "args": [], | |
| "kwargs": { | |
| "action_dim": 12, | |
| "action_horizon": 1, | |
| "clip_pred": false, | |
| "constrain_loss_dims": true, | |
| "loss_weight": 1.0, | |
| "num_preds": 12, | |
| "pool_strategy": "pass", | |
| "readout_key": "readout_quadruped" | |
| }, | |
| "module": "crossformer.model.components.action_heads", | |
| "name": "L1ActionHead" | |
| }, | |
| "single_arm": { | |
| "args": [], | |
| "kwargs": { | |
| "action_dim": 7, | |
| "action_horizon": 4, | |
| "clip_pred": false, | |
| "constrain_loss_dims": true, | |
| "loss_weight": 1.0, | |
| "num_preds": 7, | |
| "pool_strategy": "pass", | |
| "readout_key": "readout_single_arm" | |
| }, | |
| "module": "crossformer.model.components.action_heads", | |
| "name": "L1ActionHead" | |
| } | |
| }, | |
| "max_horizon": 10, | |
| "observation_tokenizers": { | |
| "bimanual": { | |
| "args": [], | |
| "kwargs": { | |
| "dropout_rate": 0.2, | |
| "obs_keys": [ | |
| "proprio_bimanual" | |
| ] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "LowdimObsTokenizer" | |
| }, | |
| "high": { | |
| "args": [], | |
| "kwargs": { | |
| "encoder": { | |
| "args": [], | |
| "kwargs": {}, | |
| "module": "crossformer.model.components.vit_encoders", | |
| "name": "ResNet26FILM" | |
| }, | |
| "obs_stack_keys": [ | |
| "image_high" | |
| ], | |
| "task_film_keys": [ | |
| "language_instruction" | |
| ], | |
| "task_stack_keys": [ | |
| "image_high" | |
| ] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "ImageTokenizer" | |
| }, | |
| "left": { | |
| "args": [], | |
| "kwargs": { | |
| "encoder": { | |
| "args": [], | |
| "kwargs": {}, | |
| "module": "crossformer.model.components.vit_encoders", | |
| "name": "ResNet26FILM" | |
| }, | |
| "obs_stack_keys": [ | |
| "image_left_wrist" | |
| ], | |
| "task_film_keys": [ | |
| "language_instruction" | |
| ], | |
| "task_stack_keys": [] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "ImageTokenizer" | |
| }, | |
| "nav": { | |
| "args": [], | |
| "kwargs": { | |
| "encoder": { | |
| "args": [], | |
| "kwargs": {}, | |
| "module": "crossformer.model.components.vit_encoders", | |
| "name": "ResNet26" | |
| }, | |
| "obs_stack_keys": [ | |
| "image_nav" | |
| ], | |
| "task_film_keys": [], | |
| "task_stack_keys": [ | |
| "image_nav" | |
| ] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "ImageTokenizer" | |
| }, | |
| "primary": { | |
| "args": [], | |
| "kwargs": { | |
| "encoder": { | |
| "args": [], | |
| "kwargs": {}, | |
| "module": "crossformer.model.components.vit_encoders", | |
| "name": "ResNet26FILM" | |
| }, | |
| "obs_stack_keys": [ | |
| "image_primary" | |
| ], | |
| "task_film_keys": [ | |
| "language_instruction" | |
| ], | |
| "task_stack_keys": [ | |
| "image_primary" | |
| ] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "ImageTokenizer" | |
| }, | |
| "quadruped": { | |
| "args": [], | |
| "kwargs": { | |
| "obs_keys": [ | |
| "proprio_quadruped" | |
| ] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "LowdimObsTokenizer" | |
| }, | |
| "right": { | |
| "args": [], | |
| "kwargs": { | |
| "encoder": { | |
| "args": [], | |
| "kwargs": {}, | |
| "module": "crossformer.model.components.vit_encoders", | |
| "name": "ResNet26FILM" | |
| }, | |
| "obs_stack_keys": [ | |
| "image_right_wrist" | |
| ], | |
| "task_film_keys": [ | |
| "language_instruction" | |
| ], | |
| "task_stack_keys": [] | |
| }, | |
| "module": "crossformer.model.components.tokenizers", | |
| "name": "ImageTokenizer" | |
| } | |
| }, | |
| "readouts": { | |
| "bimanual": 100, | |
| "nav": 4, | |
| "quadruped": 1, | |
| "single_arm": 4 | |
| }, | |
| "repeat_task_tokens": true, | |
| "task_tokenizers": {}, | |
| "token_embedding_size": 512, | |
| "transformer_kwargs": { | |
| "attention_dropout_rate": 0.0, | |
| "dropout_rate": 0.1, | |
| "mlp_dim": 2048, | |
| "num_attention_heads": 8, | |
| "num_layers": 12, | |
| "repeat_pos_enc": true | |
| } | |
| }, | |
| "num_steps": 300000, | |
| "optimizer": { | |
| "clip_gradient": 1.0, | |
| "frozen_keys": [], | |
| "learning_rate": { | |
| "init_value": 0.0, | |
| "name": "rsqrt", | |
| "peak_value": 0.0003, | |
| "timescale": 10000, | |
| "warmup_steps": 2000 | |
| }, | |
| "weight_decay": 0.1 | |
| }, | |
| "prefetch_num_batches": 0, | |
| "pretrained_loaders": [ | |
| { | |
| "module": "experiments.sudeep.aloha.resnet_pt", | |
| "name": "resnet_26_loader", | |
| "args": [], | |
| "kwargs": { | |
| "restore_path": "" | |
| } | |
| } | |
| ], | |
| "resume_path": null, | |
| "save_dir": null, | |
| "save_interval": 10000, | |
| "seed": 42, | |
| "skip_norm_keys": [ | |
| "proprio_bimanual" | |
| ], | |
| "start_step": null, | |
| "text_processor": { | |
| "args": [], | |
| "kwargs": {}, | |
| "module": "crossformer.data.utils.text_processing", | |
| "name": "UniversalSentenceEncoder" | |
| }, | |
| "val_kwargs": { | |
| "num_val_batches": 16, | |
| "val_shuffle_buffer_size": 1000 | |
| }, | |
| "viz_datasets": [], | |
| "viz_interval": 5e+20, | |
| "viz_kwargs": { | |
| "eval_batch_size": 128, | |
| "samples_per_state": 8, | |
| "trajs_for_metrics": 100, | |
| "trajs_for_viz": 8 | |
| }, | |
| "wandb": { | |
| "entity": null, | |
| "group": null, | |
| "project": "crossformer" | |
| }, | |
| "wandb_resume_id": null, | |
| "window_size": 5 | |
| } |