crossformer / config.json
rail-berkeley's picture
Upload config.json
bd5ed29 verified
{
"dataset_kwargs": {
"balance_weights": false,
"batch_size": 8,
"dataset_kwargs_list": [
{
"name": "kuka",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "kuka_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "taco_play",
"data_dir": null,
"image_obs_keys": {
"primary": "rgb_static",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "taco_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "taco_extra",
"data_dir": null,
"image_obs_keys": {
"primary": "rgb_static",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "taco_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "jaco_play",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "jaco_play_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "berkeley_cable_routing",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "berkeley_cable_routing_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "roboturk",
"data_dir": null,
"image_obs_keys": {
"primary": "front_rgb",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "roboturk_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "viola",
"data_dir": null,
"image_obs_keys": {
"primary": "agentview_rgb",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "viola_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "berkeley_autolab_ur5",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "berkeley_autolab_ur5_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "toto",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "toto_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "language_table",
"data_dir": null,
"image_obs_keys": {
"primary": "rgb",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "language_table_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "stanford_hydra_dataset_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "stanford_hydra_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "austin_buds_dataset_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "austin_buds_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "nyu_franka_play_dataset_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "nyu_franka_play_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "furniture_bench_dataset_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "furniture_bench_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "austin_sailor_dataset_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"nav": null,
"high": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "austin_sailor_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "austin_sirius_dataset_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"nav": null,
"high": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "austin_sirius_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "bc_z",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "bc_z_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "dlr_edan_shared_control_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "dlr_edan_shared_control_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "iamlab_cmu_pickup_insert_converted_externally_to_rlds",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "iamlab_pick_insert_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "utaustin_mutex",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "utaustin_mutex_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "berkeley_fanuc_manipulation",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "berkeley_fanuc_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "cmu_stretch",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "cmu_stretch_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "droid",
"data_dir": null,
"image_obs_keys": {
"primary": "exterior_image_1_left",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"filter_functions": [
{
"module": "experiments.homer.scripts.configs.cross_embodiment",
"name": "filter_success",
"args": [],
"kwargs": {}
}
],
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "droid_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_pen_uncap_diverse_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_pen_uncap_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_dough_cut_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_dough_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_lucy_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_dough_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_drawer_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_dough_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_pick_place_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_dough_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_static_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_dough_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "aloha_sushi_cut_full_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": "cam_high",
"nav": null,
"left_wrist": "cam_left_wrist",
"right_wrist": "cam_right_wrist"
},
"proprio_obs_keys": {
"bimanual": "proprio",
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false,
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "aloha_dough_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "bridge_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": "image_0",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "bridge_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "go1",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": "proprio"
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
true,
true,
true,
true,
true,
true
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "go1_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "droid_wipe",
"data_dir": null,
"image_obs_keys": {
"primary": "exterior_image_2_left",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "droid_dataset_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "omnimimic_gnm_dataset",
"data_dir": null,
"image_obs_keys": {
"primary": null,
"high": null,
"nav": "image",
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "omnimimic_gnm_transform",
"args": [],
"kwargs": {}
}
},
{
"name": "fractal20220817_data",
"data_dir": null,
"image_obs_keys": {
"primary": "image",
"high": null,
"nav": null,
"left_wrist": null,
"right_wrist": null
},
"proprio_obs_keys": {
"bimanual": null,
"quadruped": null
},
"proprio_obs_dims": {
"bimanual": 14,
"quadruped": 59
},
"action_normalization_mask": [
true,
true,
true,
true,
true,
true,
false
],
"language_key": "language_instruction",
"action_proprio_normalization_type": "normal",
"standardize_fn": {
"module": "crossformer.data.oxe.oxe_standardization_transforms",
"name": "rt1_dataset_transform",
"args": [],
"kwargs": {}
}
}
],
"frame_transform_kwargs": {
"image_augment_kwargs": {
"high": {
"augment_order": [
"random_resized_crop",
"random_brightness",
"random_contrast",
"random_saturation",
"random_hue"
],
"random_brightness": [
0.1
],
"random_contrast": [
0.9,
1.1
],
"random_hue": [
0.05
],
"random_resized_crop": {
"ratio": [
0.75,
1.3333333333333333
],
"scale": [
0.9,
1.0
]
},
"random_saturation": [
0.9,
1.1
]
},
"left_wrist": {
"augment_order": [
"random_resized_crop",
"random_brightness",
"random_contrast",
"random_saturation",
"random_hue"
],
"random_brightness": [
0.1
],
"random_contrast": [
0.9,
1.1
],
"random_hue": [
0.05
],
"random_resized_crop": {
"ratio": [
0.75,
1.3333333333333333
],
"scale": [
0.9,
1.0
]
},
"random_saturation": [
0.9,
1.1
]
},
"nav": {
"augment_order": [
"random_resized_crop",
"random_brightness",
"random_contrast",
"random_saturation",
"random_hue"
],
"random_brightness": [
0.1
],
"random_contrast": [
0.9,
1.1
],
"random_hue": [
0.05
],
"random_resized_crop": {
"ratio": [
0.9,
1.1
],
"scale": [
0.8,
1.0
]
},
"random_saturation": [
0.9,
1.1
]
},
"primary": {
"augment_order": [
"random_resized_crop",
"random_brightness",
"random_contrast",
"random_saturation",
"random_hue"
],
"random_brightness": [
0.1
],
"random_contrast": [
0.9,
1.1
],
"random_hue": [
0.05
],
"random_resized_crop": {
"ratio": [
0.9,
1.1
],
"scale": [
0.8,
1.0
]
},
"random_saturation": [
0.9,
1.1
]
},
"right_wrist": {
"augment_order": [
"random_resized_crop",
"random_brightness",
"random_contrast",
"random_saturation",
"random_hue"
],
"random_brightness": [
0.1
],
"random_contrast": [
0.9,
1.1
],
"random_hue": [
0.05
],
"random_resized_crop": {
"ratio": [
0.75,
1.3333333333333333
],
"scale": [
0.9,
1.0
]
},
"random_saturation": [
0.9,
1.1
]
}
},
"num_parallel_calls": 200,
"resize_size": {
"high": [
224,
224
],
"left_wrist": [
224,
224
],
"nav": [
224,
224
],
"primary": [
224,
224
],
"right_wrist": [
224,
224
]
}
},
"sample_weights": [
0.021755552811740044,
0.009986998241552502,
0.0023179438302583103,
0.0016371801232614254,
0.0008888419195460733,
0.007874885740329124,
0.0032054418194781,
0.004113224757060238,
0.006839324427193265,
0.01479473259297815,
0.015045048015813084,
0.0007163148639093663,
0.002826978440249719,
0.008290489894059044,
0.007414589603576858,
0.005878414243900214,
0.021755552811740044,
0.0001874782805166165,
0.0030709017944702635,
0.007599149035416076,
0.0026296096724881066,
0.0005253087662862543,
0.0002175555281174004,
0.085,
0.014166666666666666,
0.014166666666666666,
0.014166666666666666,
0.014166666666666666,
0.014166666666666666,
0.014166666666666666,
0.17,
0.085,
0.085,
0.17,
0.17
],
"shuffle_buffer_size": 25000,
"traj_read_threads": 48,
"traj_transform_kwargs": {
"action_horizon": 100,
"goal_relabeling_kwargs": {
"max_goal_distance": 15
},
"goal_relabeling_strategy": "uniform",
"head_to_dataset": {
"bimanual": [
"aloha_pen_uncap_diverse_dataset",
"aloha_dough_cut_dataset",
"aloha_lucy_dataset",
"aloha_drawer_dataset",
"aloha_pick_place_dataset",
"aloha_static_dataset",
"aloha_sushi_cut_full_dataset"
],
"nav": [
"omnimimic_gnm_dataset"
],
"quadruped": [
"go1"
],
"single_arm": [
"bridge_dataset",
"fractal20220817_data",
"kuka",
"taco_play",
"taco_extra",
"jaco_play",
"berkeley_cable_routing",
"roboturk",
"nyu_door_opening_surprising_effectiveness",
"viola",
"berkeley_autolab_ur5",
"toto",
"language_table",
"stanford_hydra_dataset_converted_externally_to_rlds",
"austin_buds_dataset_converted_externally_to_rlds",
"nyu_franka_play_dataset_converted_externally_to_rlds",
"furniture_bench_dataset_converted_externally_to_rlds",
"austin_sailor_dataset_converted_externally_to_rlds",
"austin_sirius_dataset_converted_externally_to_rlds",
"bc_z",
"dlr_edan_shared_control_converted_externally_to_rlds",
"iamlab_cmu_pickup_insert_converted_externally_to_rlds",
"utaustin_mutex",
"berkeley_fanuc_manipulation",
"cmu_stretch",
"droid",
"droid_wipe"
]
},
"max_action_dim": 14,
"subsample_length": 100,
"task_augment_kwargs": {
"keep_image_prob": 1.0
},
"task_augment_strategy": "delete_task_conditioning",
"window_size": 5
},
"traj_transform_threads": 48
},
"eval_datasets": [],
"eval_interval": 5e+20,
"log_interval": 500,
"model": {
"heads": {
"bimanual": {
"args": [],
"kwargs": {
"action_dim": 14,
"action_horizon": 100,
"clip_pred": false,
"constrain_loss_dims": true,
"loss_weight": 1.0,
"num_preds": 14,
"pool_strategy": "pass",
"readout_key": "readout_bimanual"
},
"module": "crossformer.model.components.action_heads",
"name": "L1ActionHead"
},
"nav": {
"args": [],
"kwargs": {
"action_dim": 2,
"action_horizon": 4,
"clip_pred": false,
"constrain_loss_dims": true,
"loss_weight": 1.0,
"num_preds": 2,
"pool_strategy": "pass",
"readout_key": "readout_nav"
},
"module": "crossformer.model.components.action_heads",
"name": "L1ActionHead"
},
"quadruped": {
"args": [],
"kwargs": {
"action_dim": 12,
"action_horizon": 1,
"clip_pred": false,
"constrain_loss_dims": true,
"loss_weight": 1.0,
"num_preds": 12,
"pool_strategy": "pass",
"readout_key": "readout_quadruped"
},
"module": "crossformer.model.components.action_heads",
"name": "L1ActionHead"
},
"single_arm": {
"args": [],
"kwargs": {
"action_dim": 7,
"action_horizon": 4,
"clip_pred": false,
"constrain_loss_dims": true,
"loss_weight": 1.0,
"num_preds": 7,
"pool_strategy": "pass",
"readout_key": "readout_single_arm"
},
"module": "crossformer.model.components.action_heads",
"name": "L1ActionHead"
}
},
"max_horizon": 10,
"observation_tokenizers": {
"bimanual": {
"args": [],
"kwargs": {
"dropout_rate": 0.2,
"obs_keys": [
"proprio_bimanual"
]
},
"module": "crossformer.model.components.tokenizers",
"name": "LowdimObsTokenizer"
},
"high": {
"args": [],
"kwargs": {
"encoder": {
"args": [],
"kwargs": {},
"module": "crossformer.model.components.vit_encoders",
"name": "ResNet26FILM"
},
"obs_stack_keys": [
"image_high"
],
"task_film_keys": [
"language_instruction"
],
"task_stack_keys": [
"image_high"
]
},
"module": "crossformer.model.components.tokenizers",
"name": "ImageTokenizer"
},
"left": {
"args": [],
"kwargs": {
"encoder": {
"args": [],
"kwargs": {},
"module": "crossformer.model.components.vit_encoders",
"name": "ResNet26FILM"
},
"obs_stack_keys": [
"image_left_wrist"
],
"task_film_keys": [
"language_instruction"
],
"task_stack_keys": []
},
"module": "crossformer.model.components.tokenizers",
"name": "ImageTokenizer"
},
"nav": {
"args": [],
"kwargs": {
"encoder": {
"args": [],
"kwargs": {},
"module": "crossformer.model.components.vit_encoders",
"name": "ResNet26"
},
"obs_stack_keys": [
"image_nav"
],
"task_film_keys": [],
"task_stack_keys": [
"image_nav"
]
},
"module": "crossformer.model.components.tokenizers",
"name": "ImageTokenizer"
},
"primary": {
"args": [],
"kwargs": {
"encoder": {
"args": [],
"kwargs": {},
"module": "crossformer.model.components.vit_encoders",
"name": "ResNet26FILM"
},
"obs_stack_keys": [
"image_primary"
],
"task_film_keys": [
"language_instruction"
],
"task_stack_keys": [
"image_primary"
]
},
"module": "crossformer.model.components.tokenizers",
"name": "ImageTokenizer"
},
"quadruped": {
"args": [],
"kwargs": {
"obs_keys": [
"proprio_quadruped"
]
},
"module": "crossformer.model.components.tokenizers",
"name": "LowdimObsTokenizer"
},
"right": {
"args": [],
"kwargs": {
"encoder": {
"args": [],
"kwargs": {},
"module": "crossformer.model.components.vit_encoders",
"name": "ResNet26FILM"
},
"obs_stack_keys": [
"image_right_wrist"
],
"task_film_keys": [
"language_instruction"
],
"task_stack_keys": []
},
"module": "crossformer.model.components.tokenizers",
"name": "ImageTokenizer"
}
},
"readouts": {
"bimanual": 100,
"nav": 4,
"quadruped": 1,
"single_arm": 4
},
"repeat_task_tokens": true,
"task_tokenizers": {},
"token_embedding_size": 512,
"transformer_kwargs": {
"attention_dropout_rate": 0.0,
"dropout_rate": 0.1,
"mlp_dim": 2048,
"num_attention_heads": 8,
"num_layers": 12,
"repeat_pos_enc": true
}
},
"num_steps": 300000,
"optimizer": {
"clip_gradient": 1.0,
"frozen_keys": [],
"learning_rate": {
"init_value": 0.0,
"name": "rsqrt",
"peak_value": 0.0003,
"timescale": 10000,
"warmup_steps": 2000
},
"weight_decay": 0.1
},
"prefetch_num_batches": 0,
"pretrained_loaders": [
{
"module": "experiments.sudeep.aloha.resnet_pt",
"name": "resnet_26_loader",
"args": [],
"kwargs": {
"restore_path": ""
}
}
],
"resume_path": null,
"save_dir": null,
"save_interval": 10000,
"seed": 42,
"skip_norm_keys": [
"proprio_bimanual"
],
"start_step": null,
"text_processor": {
"args": [],
"kwargs": {},
"module": "crossformer.data.utils.text_processing",
"name": "UniversalSentenceEncoder"
},
"val_kwargs": {
"num_val_batches": 16,
"val_shuffle_buffer_size": 1000
},
"viz_datasets": [],
"viz_interval": 5e+20,
"viz_kwargs": {
"eval_batch_size": 128,
"samples_per_state": 8,
"trajs_for_metrics": 100,
"trajs_for_viz": 8
},
"wandb": {
"entity": null,
"group": null,
"project": "crossformer"
},
"wandb_resume_id": null,
"window_size": 5
}