Robotics
Transformers
Safetensors
RLDX-1
vla
vision-language-action
manipulation
flow-matching
rldx
robocasa
Instructions to use RLWRLD/RLDX-1-FT-RC365 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use RLWRLD/RLDX-1-FT-RC365 with Transformers:
# Load model directly from transformers import RLDX model = RLDX.from_pretrained("RLWRLD/RLDX-1-FT-RC365", dtype="auto") - Notebooks
- Google Colab
- Kaggle
| { | |
| "processor_class": "RLDXProcessor", | |
| "processor_kwargs": { | |
| "modality_configs": { | |
| "bridge_orig": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "secondary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "iamlab_cmu_pickup_insert_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "humanoid_everyday_g1": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "egocentric_resized" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "left_hand", | |
| "right_arm", | |
| "right_hand" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "left_hand", | |
| "right_arm", | |
| "right_hand" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "dlr_edan_shared_control_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "austin_sailor_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "berkeley_autolab_ur5": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "fractal20220817_data": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "cmu_stretch": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "berkeley_cable_routing": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "secondary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "stanford_hydra_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "utaustin_mutex": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "furniture_bench_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "neural_gr1": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "ego_view" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "left_hand", | |
| "left_leg", | |
| "neck", | |
| "right_arm", | |
| "right_hand", | |
| "right_leg", | |
| "waist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "left_hand", | |
| "left_leg", | |
| "neck", | |
| "right_arm", | |
| "right_hand", | |
| "right_leg", | |
| "waist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "agibot_gripper": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist_left", | |
| "wrist_right" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "state" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "action" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "fmb_dataset": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "secondary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "dobbe": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "viola": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "humanoid_everyday_h1": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "egocentric_resized" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "left_hand", | |
| "right_arm", | |
| "right_hand" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "left_arm", | |
| "left_hand", | |
| "right_arm", | |
| "right_hand" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "austin_buds_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "taco_play": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "toto": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "language_table": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "nyu_franka_play_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "secondary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "ucsd_kitchen_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "austin_sirius_dataset_converted_externally_to_rlds": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "droid": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "secondary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "bc_z": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "kuka": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "agibot_dexhand": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "state" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "action" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "action_net": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "state" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "action" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "galaxea": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist_left", | |
| "wrist_right" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "state" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "action" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "roboturk": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "none" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "berkeley_fanuc_manipulation": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "joint_position", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "jaco_play": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "primary", | |
| "wrist" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_position" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.action.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| }, | |
| "general_embodiment": { | |
| "video": { | |
| "delta_indices": [ | |
| -6, | |
| -4, | |
| -2, | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "robot0_agentview_left", | |
| "robot0_agentview_right", | |
| "robot0_eye_in_hand" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "state": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position_relative", | |
| "end_effector_rotation_relative", | |
| "gripper_qpos", | |
| "base_position", | |
| "base_rotation" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| }, | |
| "action": { | |
| "delta_indices": [ | |
| 0, | |
| 1, | |
| 2, | |
| 3, | |
| 4, | |
| 5, | |
| 6, | |
| 7, | |
| 8, | |
| 9, | |
| 10, | |
| 11, | |
| 12, | |
| 13, | |
| 14, | |
| 15 | |
| ], | |
| "modality_keys": [ | |
| "end_effector_position", | |
| "end_effector_rotation", | |
| "gripper_close", | |
| "base_motion", | |
| "control_mode" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": [ | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "DELTA", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| }, | |
| { | |
| "rep": "ABSOLUTE", | |
| "type": "NON_EEF", | |
| "format": "DEFAULT", | |
| "state_key": null | |
| } | |
| ] | |
| }, | |
| "language": { | |
| "delta_indices": [ | |
| 0 | |
| ], | |
| "modality_keys": [ | |
| "annotation.human.task_description" | |
| ], | |
| "sin_cos_embedding_keys": null, | |
| "mean_std_embedding_keys": null, | |
| "action_configs": null | |
| } | |
| } | |
| }, | |
| "random_rotation_angle": null, | |
| "color_jitter_params": { | |
| "brightness": 0.3, | |
| "contrast": 0.4, | |
| "saturation": 0.5, | |
| "hue": 0.08 | |
| }, | |
| "model_name": "RLWRLD/RLDX-1-VLM", | |
| "model_type": "vtc_qwen3_vl", | |
| "formalize_language": true, | |
| "max_state_dim": 64, | |
| "max_action_dim": 64, | |
| "max_action_horizon": 16, | |
| "use_percentiles": true, | |
| "clip_outliers": true, | |
| "apply_sincos_state_encoding": false, | |
| "use_relative_action": true, | |
| "memory_length": 1, | |
| "general_embodiment_train_ratio": 0, | |
| "random_crop_fraction": 1.0, | |
| "image_max_area": null, | |
| "image_resize_m": 32 | |
| } | |
| } |