| { |
| "dataset_kwargs": { |
| "balance_weights": false, |
| "batch_size": 8, |
| "dataset_kwargs_list": [ |
| { |
| "name": "kuka", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "kuka_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "taco_play", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "rgb_static", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "taco_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "taco_extra", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "rgb_static", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "taco_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "jaco_play", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "jaco_play_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "berkeley_cable_routing", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "berkeley_cable_routing_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "roboturk", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "front_rgb", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "roboturk_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "viola", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "agentview_rgb", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "viola_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "berkeley_autolab_ur5", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "berkeley_autolab_ur5_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "toto", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "toto_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "language_table", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "rgb", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "language_table_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "stanford_hydra_dataset_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "stanford_hydra_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "austin_buds_dataset_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "austin_buds_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "nyu_franka_play_dataset_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "nyu_franka_play_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "furniture_bench_dataset_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "furniture_bench_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "austin_sailor_dataset_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "nav": null, |
| "high": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "austin_sailor_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "austin_sirius_dataset_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "nav": null, |
| "high": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "austin_sirius_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "bc_z", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "bc_z_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "dlr_edan_shared_control_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "dlr_edan_shared_control_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "iamlab_cmu_pickup_insert_converted_externally_to_rlds", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "iamlab_pick_insert_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "utaustin_mutex", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "utaustin_mutex_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "berkeley_fanuc_manipulation", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "berkeley_fanuc_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "cmu_stretch", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "cmu_stretch_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "droid", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "exterior_image_1_left", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "filter_functions": [ |
| { |
| "module": "experiments.homer.scripts.configs.cross_embodiment", |
| "name": "filter_success", |
| "args": [], |
| "kwargs": {} |
| } |
| ], |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "droid_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_pen_uncap_diverse_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_pen_uncap_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_dough_cut_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_dough_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_lucy_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_dough_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_drawer_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_dough_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_pick_place_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_dough_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_static_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_dough_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "aloha_sushi_cut_full_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": "cam_high", |
| "nav": null, |
| "left_wrist": "cam_left_wrist", |
| "right_wrist": "cam_right_wrist" |
| }, |
| "proprio_obs_keys": { |
| "bimanual": "proprio", |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "aloha_dough_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "bridge_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image_0", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "bridge_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "go1", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": "proprio" |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| true |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "go1_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "droid_wipe", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "exterior_image_2_left", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "droid_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "omnimimic_gnm_dataset", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": null, |
| "high": null, |
| "nav": "image", |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "omnimimic_gnm_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| }, |
| { |
| "name": "fractal20220817_data", |
| "data_dir": null, |
| "image_obs_keys": { |
| "primary": "image", |
| "high": null, |
| "nav": null, |
| "left_wrist": null, |
| "right_wrist": null |
| }, |
| "proprio_obs_keys": { |
| "bimanual": null, |
| "quadruped": null |
| }, |
| "proprio_obs_dims": { |
| "bimanual": 14, |
| "quadruped": 59 |
| }, |
| "action_normalization_mask": [ |
| true, |
| true, |
| true, |
| true, |
| true, |
| true, |
| false |
| ], |
| "language_key": "language_instruction", |
| "action_proprio_normalization_type": "normal", |
| "standardize_fn": { |
| "module": "crossformer.data.oxe.oxe_standardization_transforms", |
| "name": "rt1_dataset_transform", |
| "args": [], |
| "kwargs": {} |
| } |
| } |
| ], |
| "frame_transform_kwargs": { |
| "image_augment_kwargs": { |
| "high": { |
| "augment_order": [ |
| "random_resized_crop", |
| "random_brightness", |
| "random_contrast", |
| "random_saturation", |
| "random_hue" |
| ], |
| "random_brightness": [ |
| 0.1 |
| ], |
| "random_contrast": [ |
| 0.9, |
| 1.1 |
| ], |
| "random_hue": [ |
| 0.05 |
| ], |
| "random_resized_crop": { |
| "ratio": [ |
| 0.75, |
| 1.3333333333333333 |
| ], |
| "scale": [ |
| 0.9, |
| 1.0 |
| ] |
| }, |
| "random_saturation": [ |
| 0.9, |
| 1.1 |
| ] |
| }, |
| "left_wrist": { |
| "augment_order": [ |
| "random_resized_crop", |
| "random_brightness", |
| "random_contrast", |
| "random_saturation", |
| "random_hue" |
| ], |
| "random_brightness": [ |
| 0.1 |
| ], |
| "random_contrast": [ |
| 0.9, |
| 1.1 |
| ], |
| "random_hue": [ |
| 0.05 |
| ], |
| "random_resized_crop": { |
| "ratio": [ |
| 0.75, |
| 1.3333333333333333 |
| ], |
| "scale": [ |
| 0.9, |
| 1.0 |
| ] |
| }, |
| "random_saturation": [ |
| 0.9, |
| 1.1 |
| ] |
| }, |
| "nav": { |
| "augment_order": [ |
| "random_resized_crop", |
| "random_brightness", |
| "random_contrast", |
| "random_saturation", |
| "random_hue" |
| ], |
| "random_brightness": [ |
| 0.1 |
| ], |
| "random_contrast": [ |
| 0.9, |
| 1.1 |
| ], |
| "random_hue": [ |
| 0.05 |
| ], |
| "random_resized_crop": { |
| "ratio": [ |
| 0.9, |
| 1.1 |
| ], |
| "scale": [ |
| 0.8, |
| 1.0 |
| ] |
| }, |
| "random_saturation": [ |
| 0.9, |
| 1.1 |
| ] |
| }, |
| "primary": { |
| "augment_order": [ |
| "random_resized_crop", |
| "random_brightness", |
| "random_contrast", |
| "random_saturation", |
| "random_hue" |
| ], |
| "random_brightness": [ |
| 0.1 |
| ], |
| "random_contrast": [ |
| 0.9, |
| 1.1 |
| ], |
| "random_hue": [ |
| 0.05 |
| ], |
| "random_resized_crop": { |
| "ratio": [ |
| 0.9, |
| 1.1 |
| ], |
| "scale": [ |
| 0.8, |
| 1.0 |
| ] |
| }, |
| "random_saturation": [ |
| 0.9, |
| 1.1 |
| ] |
| }, |
| "right_wrist": { |
| "augment_order": [ |
| "random_resized_crop", |
| "random_brightness", |
| "random_contrast", |
| "random_saturation", |
| "random_hue" |
| ], |
| "random_brightness": [ |
| 0.1 |
| ], |
| "random_contrast": [ |
| 0.9, |
| 1.1 |
| ], |
| "random_hue": [ |
| 0.05 |
| ], |
| "random_resized_crop": { |
| "ratio": [ |
| 0.75, |
| 1.3333333333333333 |
| ], |
| "scale": [ |
| 0.9, |
| 1.0 |
| ] |
| }, |
| "random_saturation": [ |
| 0.9, |
| 1.1 |
| ] |
| } |
| }, |
| "num_parallel_calls": 200, |
| "resize_size": { |
| "high": [ |
| 224, |
| 224 |
| ], |
| "left_wrist": [ |
| 224, |
| 224 |
| ], |
| "nav": [ |
| 224, |
| 224 |
| ], |
| "primary": [ |
| 224, |
| 224 |
| ], |
| "right_wrist": [ |
| 224, |
| 224 |
| ] |
| } |
| }, |
| "sample_weights": [ |
| 0.021755552811740044, |
| 0.009986998241552502, |
| 0.0023179438302583103, |
| 0.0016371801232614254, |
| 0.0008888419195460733, |
| 0.007874885740329124, |
| 0.0032054418194781, |
| 0.004113224757060238, |
| 0.006839324427193265, |
| 0.01479473259297815, |
| 0.015045048015813084, |
| 0.0007163148639093663, |
| 0.002826978440249719, |
| 0.008290489894059044, |
| 0.007414589603576858, |
| 0.005878414243900214, |
| 0.021755552811740044, |
| 0.0001874782805166165, |
| 0.0030709017944702635, |
| 0.007599149035416076, |
| 0.0026296096724881066, |
| 0.0005253087662862543, |
| 0.0002175555281174004, |
| 0.085, |
| 0.014166666666666666, |
| 0.014166666666666666, |
| 0.014166666666666666, |
| 0.014166666666666666, |
| 0.014166666666666666, |
| 0.014166666666666666, |
| 0.17, |
| 0.085, |
| 0.085, |
| 0.17, |
| 0.17 |
| ], |
| "shuffle_buffer_size": 25000, |
| "traj_read_threads": 48, |
| "traj_transform_kwargs": { |
| "action_horizon": 100, |
| "goal_relabeling_kwargs": { |
| "max_goal_distance": 15 |
| }, |
| "goal_relabeling_strategy": "uniform", |
| "head_to_dataset": { |
| "bimanual": [ |
| "aloha_pen_uncap_diverse_dataset", |
| "aloha_dough_cut_dataset", |
| "aloha_lucy_dataset", |
| "aloha_drawer_dataset", |
| "aloha_pick_place_dataset", |
| "aloha_static_dataset", |
| "aloha_sushi_cut_full_dataset" |
| ], |
| "nav": [ |
| "omnimimic_gnm_dataset" |
| ], |
| "quadruped": [ |
| "go1" |
| ], |
| "single_arm": [ |
| "bridge_dataset", |
| "fractal20220817_data", |
| "kuka", |
| "taco_play", |
| "taco_extra", |
| "jaco_play", |
| "berkeley_cable_routing", |
| "roboturk", |
| "nyu_door_opening_surprising_effectiveness", |
| "viola", |
| "berkeley_autolab_ur5", |
| "toto", |
| "language_table", |
| "stanford_hydra_dataset_converted_externally_to_rlds", |
| "austin_buds_dataset_converted_externally_to_rlds", |
| "nyu_franka_play_dataset_converted_externally_to_rlds", |
| "furniture_bench_dataset_converted_externally_to_rlds", |
| "austin_sailor_dataset_converted_externally_to_rlds", |
| "austin_sirius_dataset_converted_externally_to_rlds", |
| "bc_z", |
| "dlr_edan_shared_control_converted_externally_to_rlds", |
| "iamlab_cmu_pickup_insert_converted_externally_to_rlds", |
| "utaustin_mutex", |
| "berkeley_fanuc_manipulation", |
| "cmu_stretch", |
| "droid", |
| "droid_wipe" |
| ] |
| }, |
| "max_action_dim": 14, |
| "subsample_length": 100, |
| "task_augment_kwargs": { |
| "keep_image_prob": 1.0 |
| }, |
| "task_augment_strategy": "delete_task_conditioning", |
| "window_size": 5 |
| }, |
| "traj_transform_threads": 48 |
| }, |
| "eval_datasets": [], |
| "eval_interval": 5e+20, |
| "log_interval": 500, |
| "model": { |
| "heads": { |
| "bimanual": { |
| "args": [], |
| "kwargs": { |
| "action_dim": 14, |
| "action_horizon": 100, |
| "clip_pred": false, |
| "constrain_loss_dims": true, |
| "loss_weight": 1.0, |
| "num_preds": 14, |
| "pool_strategy": "pass", |
| "readout_key": "readout_bimanual" |
| }, |
| "module": "crossformer.model.components.action_heads", |
| "name": "L1ActionHead" |
| }, |
| "nav": { |
| "args": [], |
| "kwargs": { |
| "action_dim": 2, |
| "action_horizon": 4, |
| "clip_pred": false, |
| "constrain_loss_dims": true, |
| "loss_weight": 1.0, |
| "num_preds": 2, |
| "pool_strategy": "pass", |
| "readout_key": "readout_nav" |
| }, |
| "module": "crossformer.model.components.action_heads", |
| "name": "L1ActionHead" |
| }, |
| "quadruped": { |
| "args": [], |
| "kwargs": { |
| "action_dim": 12, |
| "action_horizon": 1, |
| "clip_pred": false, |
| "constrain_loss_dims": true, |
| "loss_weight": 1.0, |
| "num_preds": 12, |
| "pool_strategy": "pass", |
| "readout_key": "readout_quadruped" |
| }, |
| "module": "crossformer.model.components.action_heads", |
| "name": "L1ActionHead" |
| }, |
| "single_arm": { |
| "args": [], |
| "kwargs": { |
| "action_dim": 7, |
| "action_horizon": 4, |
| "clip_pred": false, |
| "constrain_loss_dims": true, |
| "loss_weight": 1.0, |
| "num_preds": 7, |
| "pool_strategy": "pass", |
| "readout_key": "readout_single_arm" |
| }, |
| "module": "crossformer.model.components.action_heads", |
| "name": "L1ActionHead" |
| } |
| }, |
| "max_horizon": 10, |
| "observation_tokenizers": { |
| "bimanual": { |
| "args": [], |
| "kwargs": { |
| "dropout_rate": 0.2, |
| "obs_keys": [ |
| "proprio_bimanual" |
| ] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "LowdimObsTokenizer" |
| }, |
| "high": { |
| "args": [], |
| "kwargs": { |
| "encoder": { |
| "args": [], |
| "kwargs": {}, |
| "module": "crossformer.model.components.vit_encoders", |
| "name": "ResNet26FILM" |
| }, |
| "obs_stack_keys": [ |
| "image_high" |
| ], |
| "task_film_keys": [ |
| "language_instruction" |
| ], |
| "task_stack_keys": [ |
| "image_high" |
| ] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "ImageTokenizer" |
| }, |
| "left": { |
| "args": [], |
| "kwargs": { |
| "encoder": { |
| "args": [], |
| "kwargs": {}, |
| "module": "crossformer.model.components.vit_encoders", |
| "name": "ResNet26FILM" |
| }, |
| "obs_stack_keys": [ |
| "image_left_wrist" |
| ], |
| "task_film_keys": [ |
| "language_instruction" |
| ], |
| "task_stack_keys": [] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "ImageTokenizer" |
| }, |
| "nav": { |
| "args": [], |
| "kwargs": { |
| "encoder": { |
| "args": [], |
| "kwargs": {}, |
| "module": "crossformer.model.components.vit_encoders", |
| "name": "ResNet26" |
| }, |
| "obs_stack_keys": [ |
| "image_nav" |
| ], |
| "task_film_keys": [], |
| "task_stack_keys": [ |
| "image_nav" |
| ] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "ImageTokenizer" |
| }, |
| "primary": { |
| "args": [], |
| "kwargs": { |
| "encoder": { |
| "args": [], |
| "kwargs": {}, |
| "module": "crossformer.model.components.vit_encoders", |
| "name": "ResNet26FILM" |
| }, |
| "obs_stack_keys": [ |
| "image_primary" |
| ], |
| "task_film_keys": [ |
| "language_instruction" |
| ], |
| "task_stack_keys": [ |
| "image_primary" |
| ] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "ImageTokenizer" |
| }, |
| "quadruped": { |
| "args": [], |
| "kwargs": { |
| "obs_keys": [ |
| "proprio_quadruped" |
| ] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "LowdimObsTokenizer" |
| }, |
| "right": { |
| "args": [], |
| "kwargs": { |
| "encoder": { |
| "args": [], |
| "kwargs": {}, |
| "module": "crossformer.model.components.vit_encoders", |
| "name": "ResNet26FILM" |
| }, |
| "obs_stack_keys": [ |
| "image_right_wrist" |
| ], |
| "task_film_keys": [ |
| "language_instruction" |
| ], |
| "task_stack_keys": [] |
| }, |
| "module": "crossformer.model.components.tokenizers", |
| "name": "ImageTokenizer" |
| } |
| }, |
| "readouts": { |
| "bimanual": 100, |
| "nav": 4, |
| "quadruped": 1, |
| "single_arm": 4 |
| }, |
| "repeat_task_tokens": true, |
| "task_tokenizers": {}, |
| "token_embedding_size": 512, |
| "transformer_kwargs": { |
| "attention_dropout_rate": 0.0, |
| "dropout_rate": 0.1, |
| "mlp_dim": 2048, |
| "num_attention_heads": 8, |
| "num_layers": 12, |
| "repeat_pos_enc": true |
| } |
| }, |
| "num_steps": 300000, |
| "optimizer": { |
| "clip_gradient": 1.0, |
| "frozen_keys": [], |
| "learning_rate": { |
| "init_value": 0.0, |
| "name": "rsqrt", |
| "peak_value": 0.0003, |
| "timescale": 10000, |
| "warmup_steps": 2000 |
| }, |
| "weight_decay": 0.1 |
| }, |
| "prefetch_num_batches": 0, |
| "pretrained_loaders": [ |
| { |
| "module": "experiments.sudeep.aloha.resnet_pt", |
| "name": "resnet_26_loader", |
| "args": [], |
| "kwargs": { |
| "restore_path": "" |
| } |
| } |
| ], |
| "resume_path": null, |
| "save_dir": null, |
| "save_interval": 10000, |
| "seed": 42, |
| "skip_norm_keys": [ |
| "proprio_bimanual" |
| ], |
| "start_step": null, |
| "text_processor": { |
| "args": [], |
| "kwargs": {}, |
| "module": "crossformer.data.utils.text_processing", |
| "name": "UniversalSentenceEncoder" |
| }, |
| "val_kwargs": { |
| "num_val_batches": 16, |
| "val_shuffle_buffer_size": 1000 |
| }, |
| "viz_datasets": [], |
| "viz_interval": 5e+20, |
| "viz_kwargs": { |
| "eval_batch_size": 128, |
| "samples_per_state": 8, |
| "trajs_for_metrics": 100, |
| "trajs_for_viz": 8 |
| }, |
| "wandb": { |
| "entity": null, |
| "group": null, |
| "project": "crossformer" |
| }, |
| "wandb_resume_id": null, |
| "window_size": 5 |
| } |