eval
Browse files- cross_peginsertionside/best_model.zip +3 -0
- cross_peginsertionside/params/agent.yaml +104 -0
- cross_stackcube/best_model.zip +3 -0
- cross_stackcube/params/agent.yaml +104 -0
- cross_tworobotstackcube/best_model.zip +3 -0
- cross_tworobotstackcube/params/agent.yaml +99 -0
- cross_unitreeg1transportbox/best_model.zip +3 -0
- cross_unitreeg1transportbox/params/agent.yaml +104 -0
- lstm_peginsertionside/best_model.zip +3 -0
- lstm_peginsertionside/params/agent.yaml +94 -0
- lstm_stackcube/best_model.zip +3 -0
- lstm_stackcube/params/agent.yaml +94 -0
- lstm_tworobotstackcube/best_model.zip +3 -0
- lstm_tworobotstackcube/params/agent.yaml +89 -0
- lstm_unitreeg1transportbox/best_model.zip +3 -0
- lstm_unitreeg1transportbox/params/agent.yaml +94 -0
- none_peginsertionside/best_model.zip +3 -0
- none_peginsertionside/params/agent.yaml +104 -0
- none_stackcube/best_model.zip +3 -0
- none_stackcube/params/agent.yaml +98 -0
- none_tworobotstackcube/best_model.zip +3 -0
- none_tworobotstackcube/params/agent.yaml +99 -0
- none_unitreeg1transportbox/best_model.zip +3 -0
- none_unitreeg1transportbox/params/agent.yaml +104 -0
- sta_peginsertionside/best_model.zip +3 -0
- sta_peginsertionside/params/agent.yaml +98 -0
- sta_peginsertionside_noisy/best_model.zip +3 -0
- sta_peginsertionside_noisy/params/agent.yaml +104 -0
- sta_stackcube/best_model.zip +3 -0
- sta_stackcube/params/agent.yaml +104 -0
- sta_stackcube_noisy/best_model.zip +3 -0
- sta_stackcube_noisy/params/agent.yaml +104 -0
- sta_tworobotstackcube/best_model.zip +3 -0
- sta_tworobotstackcube/params/agent.yaml +99 -0
- sta_tworobotstackcube_noisy/best_model.zip +3 -0
- sta_tworobotstackcube_noisy/params/agent.yaml +99 -0
- sta_unitreeg1transportbox/best_model.zip +3 -0
- sta_unitreeg1transportbox/params/agent.yaml +104 -0
- sta_unitreeg1transportbox_noisy/best_model.zip +3 -0
- sta_unitreeg1transportbox_noisy/params/agent.yaml +104 -0
- tcn_peginsertionside/best_model.zip +3 -0
- tcn_peginsertionside/params/agent.yaml +94 -0
- tcn_stackcube/best_model.zip +3 -0
- tcn_stackcube/params/agent.yaml +94 -0
- tcn_tworobotstackcube/best_model.zip +3 -0
- tcn_tworobotstackcube/params/agent.yaml +89 -0
- tcn_unitreeg1transportbox/best_model.zip +3 -0
- tcn_unitreeg1transportbox/params/agent.yaml +94 -0
cross_peginsertionside/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4236675d6537384de34ae6b135dbc3704e16feea0e1de27cb46723ceb0caab6a
|
| 3 |
+
size 93175179
|
cross_peginsertionside/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: PegInsertionSide-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: PegInsertionSide-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.hand_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 9
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 8
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
cross_stackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eda55ea9e1f8307ee644bd07811ecfa905b19768cf8af8da8825ea015ad98c21
|
| 3 |
+
size 93175118
|
cross_stackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: StackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: StackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.hand_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 9
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 30
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 8
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
cross_tworobotstackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41ca41133e0f04e72bf55945157c3adf1191e52a018134a4c8155b07d80df57e
|
| 3 |
+
size 93219135
|
cross_tworobotstackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: TwoRobotStackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: TwoRobotStackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.image: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.state: !!python/tuple
|
| 80 |
+
- 18
|
| 81 |
+
observation.privileged: !!python/tuple
|
| 82 |
+
- 40
|
| 83 |
+
output_shapes:
|
| 84 |
+
action: !!python/tuple
|
| 85 |
+
- 16
|
| 86 |
+
- 16
|
| 87 |
+
normalization:
|
| 88 |
+
observation_modes:
|
| 89 |
+
observation.state: min_max
|
| 90 |
+
action_modes:
|
| 91 |
+
action: min_max
|
| 92 |
+
fps: 20
|
| 93 |
+
delta_timestamps:
|
| 94 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 95 |
+
observation.image: '[i / 20 for i in range(16)]'
|
| 96 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 97 |
+
action: '[i / 20 for i in range(16)]'
|
| 98 |
+
image_transforms:
|
| 99 |
+
enable: false
|
cross_unitreeg1transportbox/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a72cbc84bd0d33c7bb3dbb7a3858e05a7014b8b93a369c03699909f5c335a3a
|
| 3 |
+
size 93255978
|
cross_unitreeg1transportbox/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: UnitreeG1TransportBox-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: UnitreeG1TransportBox-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.head_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 25
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 25
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.head_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
lstm_peginsertionside/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:481b2a2417fd1ac3aa8691f7ba906efe587dd0fc67e9231a509b4d883d828714
|
| 3 |
+
size 42676885
|
lstm_peginsertionside/params/agent.yaml
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: LSTMPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: PegInsertionSide-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: PegInsertionSide-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.images.base_camera: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.images.hand_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.state: !!python/tuple
|
| 74 |
+
- 9
|
| 75 |
+
observation.privileged: !!python/tuple
|
| 76 |
+
- 27
|
| 77 |
+
output_shapes:
|
| 78 |
+
action: !!python/tuple
|
| 79 |
+
- 16
|
| 80 |
+
- 8
|
| 81 |
+
normalization:
|
| 82 |
+
observation_modes:
|
| 83 |
+
observation.state: min_max
|
| 84 |
+
action_modes:
|
| 85 |
+
action: min_max
|
| 86 |
+
fps: 20
|
| 87 |
+
delta_timestamps:
|
| 88 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 89 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 90 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 91 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 92 |
+
action: '[i / 20 for i in range(16)]'
|
| 93 |
+
image_transforms:
|
| 94 |
+
enable: false
|
lstm_stackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3863c1d750feb2d79aa18c36d2d7c895f24d9e9dd48b1d6c45747f98ec459665
|
| 3 |
+
size 42676824
|
lstm_stackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: LSTMPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: StackCube-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: StackCube-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.images.base_camera: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.images.hand_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.state: !!python/tuple
|
| 74 |
+
- 9
|
| 75 |
+
observation.privileged: !!python/tuple
|
| 76 |
+
- 30
|
| 77 |
+
output_shapes:
|
| 78 |
+
action: !!python/tuple
|
| 79 |
+
- 16
|
| 80 |
+
- 8
|
| 81 |
+
normalization:
|
| 82 |
+
observation_modes:
|
| 83 |
+
observation.state: min_max
|
| 84 |
+
action_modes:
|
| 85 |
+
action: min_max
|
| 86 |
+
fps: 20
|
| 87 |
+
delta_timestamps:
|
| 88 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 89 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 90 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 91 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 92 |
+
action: '[i / 20 for i in range(16)]'
|
| 93 |
+
image_transforms:
|
| 94 |
+
enable: false
|
lstm_tworobotstackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:60c1de3094b962f8eaf3c7d9faf96e59e9eb92431850cc59d3798c9f5b4b6bfd
|
| 3 |
+
size 41653831
|
lstm_tworobotstackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: LSTMPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: TwoRobotStackCube-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: TwoRobotStackCube-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.image: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.state: !!python/tuple
|
| 70 |
+
- 18
|
| 71 |
+
observation.privileged: !!python/tuple
|
| 72 |
+
- 40
|
| 73 |
+
output_shapes:
|
| 74 |
+
action: !!python/tuple
|
| 75 |
+
- 16
|
| 76 |
+
- 16
|
| 77 |
+
normalization:
|
| 78 |
+
observation_modes:
|
| 79 |
+
observation.state: min_max
|
| 80 |
+
action_modes:
|
| 81 |
+
action: min_max
|
| 82 |
+
fps: 20
|
| 83 |
+
delta_timestamps:
|
| 84 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 85 |
+
observation.image: '[i / 20 for i in range(16)]'
|
| 86 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 87 |
+
action: '[i / 20 for i in range(16)]'
|
| 88 |
+
image_transforms:
|
| 89 |
+
enable: false
|
lstm_unitreeg1transportbox/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f2f44037adaebbebfa4cfd8f3ccdf07d068616a1475763bb49bc53964af02be
|
| 3 |
+
size 42724986
|
lstm_unitreeg1transportbox/params/agent.yaml
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: LSTMPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: UnitreeG1TransportBox-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: UnitreeG1TransportBox-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.images.base_camera: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.images.head_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.state: !!python/tuple
|
| 74 |
+
- 25
|
| 75 |
+
observation.privileged: !!python/tuple
|
| 76 |
+
- 27
|
| 77 |
+
output_shapes:
|
| 78 |
+
action: !!python/tuple
|
| 79 |
+
- 16
|
| 80 |
+
- 25
|
| 81 |
+
normalization:
|
| 82 |
+
observation_modes:
|
| 83 |
+
observation.state: min_max
|
| 84 |
+
action_modes:
|
| 85 |
+
action: min_max
|
| 86 |
+
fps: 20
|
| 87 |
+
delta_timestamps:
|
| 88 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 89 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 90 |
+
observation.images.head_camera: '[i / 20 for i in range(16)]'
|
| 91 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 92 |
+
action: '[i / 20 for i in range(16)]'
|
| 93 |
+
image_transforms:
|
| 94 |
+
enable: false
|
none_peginsertionside/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91f462488160c8089ccd2e7071f566291b1a24f0fba9748a749682b9797d7ffc
|
| 3 |
+
size 93175181
|
none_peginsertionside/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: false
|
| 22 |
+
ca_att: false
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: PegInsertionSide-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: PegInsertionSide-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.hand_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 9
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 8
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
none_stackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c991aac3d9207510a2a021c9d6c3b93c17ea6a015c3bfb393830eee59ee9d277
|
| 3 |
+
size 93175121
|
none_stackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,98 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 200
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: TransformerPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_flag: false
|
| 22 |
+
ca_flag: false
|
| 23 |
+
sta_flag: false
|
| 24 |
+
sta_residual: false
|
| 25 |
+
sta_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Agent
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
observation_modes:
|
| 39 |
+
observation.state: min_max
|
| 40 |
+
action_modes:
|
| 41 |
+
action: min_max
|
| 42 |
+
overwrite_stats: false
|
| 43 |
+
stats: null
|
| 44 |
+
data_key_map:
|
| 45 |
+
observation.images.base_camera: cam1
|
| 46 |
+
observation.images.hand_camera: cam2
|
| 47 |
+
observation.images.head_camera: cam2
|
| 48 |
+
observation.images.image_side_1: cam1
|
| 49 |
+
observation.images.image_side_2: cam2
|
| 50 |
+
observation.images.image_wrist_1: cam3
|
| 51 |
+
observation.images.image_wrist_2: cam4
|
| 52 |
+
observation.top: cam1
|
| 53 |
+
image: cam1
|
| 54 |
+
wrist_image: cam2
|
| 55 |
+
observation.state: state
|
| 56 |
+
state: state
|
| 57 |
+
action: action
|
| 58 |
+
actions: action
|
| 59 |
+
task: StackCube-v1
|
| 60 |
+
env_cfg:
|
| 61 |
+
name: maniskill
|
| 62 |
+
task: StackCube-v1
|
| 63 |
+
dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
|
| 64 |
+
episodes: null
|
| 65 |
+
dataset_revision: v2.0
|
| 66 |
+
dataset_root: null
|
| 67 |
+
video_backend: pyav
|
| 68 |
+
input_shapes:
|
| 69 |
+
observation.images.base_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.images.hand_camera: !!python/tuple
|
| 74 |
+
- 480
|
| 75 |
+
- 640
|
| 76 |
+
- 3
|
| 77 |
+
observation.state: !!python/tuple
|
| 78 |
+
- 9
|
| 79 |
+
observation.privileged: !!python/tuple
|
| 80 |
+
- 30
|
| 81 |
+
output_shapes:
|
| 82 |
+
action: !!python/tuple
|
| 83 |
+
- 16
|
| 84 |
+
- 8
|
| 85 |
+
normalization:
|
| 86 |
+
observation_modes:
|
| 87 |
+
observation.state: min_max
|
| 88 |
+
action_modes:
|
| 89 |
+
action: min_max
|
| 90 |
+
fps: 20
|
| 91 |
+
delta_timestamps:
|
| 92 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 93 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 94 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 95 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 96 |
+
action: '[i / 20 for i in range(16)]'
|
| 97 |
+
image_transforms:
|
| 98 |
+
enable: false
|
none_tworobotstackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38bef25c60cb946966c5c56ea2d881437e4e2dcf3bb82aaa3da0b21e62c08c3f
|
| 3 |
+
size 93219134
|
none_tworobotstackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: false
|
| 22 |
+
ca_att: false
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: TwoRobotStackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: TwoRobotStackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.image: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.state: !!python/tuple
|
| 80 |
+
- 18
|
| 81 |
+
observation.privileged: !!python/tuple
|
| 82 |
+
- 40
|
| 83 |
+
output_shapes:
|
| 84 |
+
action: !!python/tuple
|
| 85 |
+
- 16
|
| 86 |
+
- 16
|
| 87 |
+
normalization:
|
| 88 |
+
observation_modes:
|
| 89 |
+
observation.state: min_max
|
| 90 |
+
action_modes:
|
| 91 |
+
action: min_max
|
| 92 |
+
fps: 20
|
| 93 |
+
delta_timestamps:
|
| 94 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 95 |
+
observation.image: '[i / 20 for i in range(16)]'
|
| 96 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 97 |
+
action: '[i / 20 for i in range(16)]'
|
| 98 |
+
image_transforms:
|
| 99 |
+
enable: false
|
none_unitreeg1transportbox/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0274a2dee4c158384796bc95b982f4194839e004951a7ea39759a56c933889f5
|
| 3 |
+
size 93255981
|
none_unitreeg1transportbox/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: false
|
| 22 |
+
ca_att: false
|
| 23 |
+
army_att: false
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: UnitreeG1TransportBox-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: UnitreeG1TransportBox-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.head_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 25
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 25
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.head_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
sta_peginsertionside/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e4814f84dab65674c120a46a2fb252580538f57f43bc8323849a7fc62348c41
|
| 3 |
+
size 93175183
|
sta_peginsertionside/params/agent.yaml
ADDED
|
@@ -0,0 +1,98 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 200
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: TransformerPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_flag: true
|
| 22 |
+
ca_flag: true
|
| 23 |
+
sta_flag: true
|
| 24 |
+
sta_residual: false
|
| 25 |
+
sta_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: true
|
| 32 |
+
preprocessor_class: Lerobot_2_Agent
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
observation_modes:
|
| 39 |
+
observation.state: min_max
|
| 40 |
+
action_modes:
|
| 41 |
+
action: min_max
|
| 42 |
+
overwrite_stats: false
|
| 43 |
+
stats: null
|
| 44 |
+
data_key_map:
|
| 45 |
+
observation.images.base_camera: cam1
|
| 46 |
+
observation.images.hand_camera: cam2
|
| 47 |
+
observation.images.head_camera: cam2
|
| 48 |
+
observation.images.image_side_1: cam1
|
| 49 |
+
observation.images.image_side_2: cam2
|
| 50 |
+
observation.images.image_wrist_1: cam3
|
| 51 |
+
observation.images.image_wrist_2: cam4
|
| 52 |
+
observation.top: cam1
|
| 53 |
+
image: cam1
|
| 54 |
+
wrist_image: cam2
|
| 55 |
+
observation.state: state
|
| 56 |
+
state: state
|
| 57 |
+
action: action
|
| 58 |
+
actions: action
|
| 59 |
+
task: PegInsertionSide-v1
|
| 60 |
+
env_cfg:
|
| 61 |
+
name: maniskill
|
| 62 |
+
task: PegInsertionSide-v1
|
| 63 |
+
dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
|
| 64 |
+
episodes: null
|
| 65 |
+
dataset_revision: v2.0
|
| 66 |
+
dataset_root: null
|
| 67 |
+
video_backend: pyav
|
| 68 |
+
input_shapes:
|
| 69 |
+
observation.images.base_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.images.hand_camera: !!python/tuple
|
| 74 |
+
- 480
|
| 75 |
+
- 640
|
| 76 |
+
- 3
|
| 77 |
+
observation.state: !!python/tuple
|
| 78 |
+
- 9
|
| 79 |
+
observation.privileged: !!python/tuple
|
| 80 |
+
- 27
|
| 81 |
+
output_shapes:
|
| 82 |
+
action: !!python/tuple
|
| 83 |
+
- 16
|
| 84 |
+
- 8
|
| 85 |
+
normalization:
|
| 86 |
+
observation_modes:
|
| 87 |
+
observation.state: min_max
|
| 88 |
+
action_modes:
|
| 89 |
+
action: min_max
|
| 90 |
+
fps: 20
|
| 91 |
+
delta_timestamps:
|
| 92 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 93 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 94 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 95 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 96 |
+
action: '[i / 20 for i in range(16)]'
|
| 97 |
+
image_transforms:
|
| 98 |
+
enable: false
|
sta_peginsertionside_noisy/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:95149197c474d978c9c540c6011aa373f3ca750655d23c686527480e48a0fefc
|
| 3 |
+
size 93175182
|
sta_peginsertionside_noisy/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: true
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: PegInsertionSide-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: PegInsertionSide-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.hand_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 9
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 8
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
sta_stackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d714678729d554c791038f8a62d6099edfdedcebec87417f3abf67820b69eeb0
|
| 3 |
+
size 93175117
|
sta_stackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: StackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: StackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.hand_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 9
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 30
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 8
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
sta_stackcube_noisy/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef31875454bfd56a639d112ee74b16f7336ae05e5e5c70c0cfa1abf25b3dd3f0
|
| 3 |
+
size 93175116
|
sta_stackcube_noisy/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: true
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: StackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: StackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.hand_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 9
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 30
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 8
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
sta_tworobotstackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da45ef75d11ce0f92c8a193a6662a5d5cd1aa139f07a89f89fe92a1e46fd977c
|
| 3 |
+
size 93219132
|
sta_tworobotstackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: TwoRobotStackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: TwoRobotStackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.image: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.state: !!python/tuple
|
| 80 |
+
- 18
|
| 81 |
+
observation.privileged: !!python/tuple
|
| 82 |
+
- 40
|
| 83 |
+
output_shapes:
|
| 84 |
+
action: !!python/tuple
|
| 85 |
+
- 16
|
| 86 |
+
- 16
|
| 87 |
+
normalization:
|
| 88 |
+
observation_modes:
|
| 89 |
+
observation.state: min_max
|
| 90 |
+
action_modes:
|
| 91 |
+
action: min_max
|
| 92 |
+
fps: 20
|
| 93 |
+
delta_timestamps:
|
| 94 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 95 |
+
observation.image: '[i / 20 for i in range(16)]'
|
| 96 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 97 |
+
action: '[i / 20 for i in range(16)]'
|
| 98 |
+
image_transforms:
|
| 99 |
+
enable: false
|
sta_tworobotstackcube_noisy/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74b77a37d4f2c2ddeb23580ae48e1e89788c86e082666010733917800b5406ec
|
| 3 |
+
size 93219131
|
sta_tworobotstackcube_noisy/params/agent.yaml
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: true
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: TwoRobotStackCube-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: TwoRobotStackCube-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.image: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.state: !!python/tuple
|
| 80 |
+
- 18
|
| 81 |
+
observation.privileged: !!python/tuple
|
| 82 |
+
- 40
|
| 83 |
+
output_shapes:
|
| 84 |
+
action: !!python/tuple
|
| 85 |
+
- 16
|
| 86 |
+
- 16
|
| 87 |
+
normalization:
|
| 88 |
+
observation_modes:
|
| 89 |
+
observation.state: min_max
|
| 90 |
+
action_modes:
|
| 91 |
+
action: min_max
|
| 92 |
+
fps: 20
|
| 93 |
+
delta_timestamps:
|
| 94 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 95 |
+
observation.image: '[i / 20 for i in range(16)]'
|
| 96 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 97 |
+
action: '[i / 20 for i in range(16)]'
|
| 98 |
+
image_transforms:
|
| 99 |
+
enable: false
|
sta_unitreeg1transportbox/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba139bc6eef6088de70c5d67f1e97da247865c75db47bff8f76448b5b8cd8c76
|
| 3 |
+
size 93255978
|
sta_unitreeg1transportbox/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: false
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: UnitreeG1TransportBox-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: UnitreeG1TransportBox-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.head_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 25
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 25
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.head_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
sta_unitreeg1transportbox_noisy/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:275345602402e5826857b67fd9f5d1a43f66841a28b683c3bcf3bada3ebb01be
|
| 3 |
+
size 93255977
|
sta_unitreeg1transportbox_noisy/params/agent.yaml
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 50
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: ARMYPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_decoder: 512
|
| 17 |
+
n_decoder_layers: 4
|
| 18 |
+
n_decoder_heads: 8
|
| 19 |
+
use_rmsnorm: true
|
| 20 |
+
pre_norm: true
|
| 21 |
+
sa_att: true
|
| 22 |
+
ca_att: true
|
| 23 |
+
army_att: true
|
| 24 |
+
army_residual: false
|
| 25 |
+
army_norm: math
|
| 26 |
+
dropout: 0.0
|
| 27 |
+
dropout_residual: 0.0
|
| 28 |
+
action_horizon: 16
|
| 29 |
+
optimizer_kwargs:
|
| 30 |
+
eps: 1.0e-08
|
| 31 |
+
noise: true
|
| 32 |
+
preprocessor_class: Lerobot_2_Army
|
| 33 |
+
preprocessor_kwargs:
|
| 34 |
+
resize_images: !!python/tuple
|
| 35 |
+
- 94
|
| 36 |
+
- 94
|
| 37 |
+
normalize_images: true
|
| 38 |
+
tokenizer_kwargs:
|
| 39 |
+
model_template: qwen2-chat
|
| 40 |
+
num_image_token: 9
|
| 41 |
+
padding_max_length: 60
|
| 42 |
+
padding_side: right
|
| 43 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 44 |
+
observation_modes:
|
| 45 |
+
observation.state: min_max
|
| 46 |
+
action_modes:
|
| 47 |
+
action: min_max
|
| 48 |
+
overwrite_stats: false
|
| 49 |
+
stats: null
|
| 50 |
+
data_key_map:
|
| 51 |
+
observation.images.base_camera: cam1
|
| 52 |
+
observation.images.hand_camera: cam2
|
| 53 |
+
observation.images.head_camera: cam2
|
| 54 |
+
observation.images.image_side_1: cam1
|
| 55 |
+
observation.images.image_side_2: cam2
|
| 56 |
+
observation.images.image_wrist_1: cam3
|
| 57 |
+
observation.images.image_wrist_2: cam4
|
| 58 |
+
observation.top: cam1
|
| 59 |
+
image: cam1
|
| 60 |
+
wrist_image: cam2
|
| 61 |
+
observation.state: state
|
| 62 |
+
state: state
|
| 63 |
+
action: action
|
| 64 |
+
actions: action
|
| 65 |
+
task: UnitreeG1TransportBox-v1
|
| 66 |
+
env_cfg:
|
| 67 |
+
name: maniskill
|
| 68 |
+
task: UnitreeG1TransportBox-v1
|
| 69 |
+
dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
|
| 70 |
+
episodes: null
|
| 71 |
+
dataset_revision: v2.0
|
| 72 |
+
dataset_root: null
|
| 73 |
+
video_backend: pyav
|
| 74 |
+
input_shapes:
|
| 75 |
+
observation.images.base_camera: !!python/tuple
|
| 76 |
+
- 480
|
| 77 |
+
- 640
|
| 78 |
+
- 3
|
| 79 |
+
observation.images.head_camera: !!python/tuple
|
| 80 |
+
- 480
|
| 81 |
+
- 640
|
| 82 |
+
- 3
|
| 83 |
+
observation.state: !!python/tuple
|
| 84 |
+
- 25
|
| 85 |
+
observation.privileged: !!python/tuple
|
| 86 |
+
- 27
|
| 87 |
+
output_shapes:
|
| 88 |
+
action: !!python/tuple
|
| 89 |
+
- 16
|
| 90 |
+
- 25
|
| 91 |
+
normalization:
|
| 92 |
+
observation_modes:
|
| 93 |
+
observation.state: min_max
|
| 94 |
+
action_modes:
|
| 95 |
+
action: min_max
|
| 96 |
+
fps: 20
|
| 97 |
+
delta_timestamps:
|
| 98 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 99 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 100 |
+
observation.images.head_camera: '[i / 20 for i in range(16)]'
|
| 101 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 102 |
+
action: '[i / 20 for i in range(16)]'
|
| 103 |
+
image_transforms:
|
| 104 |
+
enable: false
|
tcn_peginsertionside/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed19d3a5e08c7de93c8525848d6be466c083504400fa90e115ebc4280152ab56
|
| 3 |
+
size 39797489
|
tcn_peginsertionside/params/agent.yaml
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: TCNPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: PegInsertionSide-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: PegInsertionSide-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.images.base_camera: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.images.hand_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.state: !!python/tuple
|
| 74 |
+
- 9
|
| 75 |
+
observation.privileged: !!python/tuple
|
| 76 |
+
- 27
|
| 77 |
+
output_shapes:
|
| 78 |
+
action: !!python/tuple
|
| 79 |
+
- 16
|
| 80 |
+
- 8
|
| 81 |
+
normalization:
|
| 82 |
+
observation_modes:
|
| 83 |
+
observation.state: min_max
|
| 84 |
+
action_modes:
|
| 85 |
+
action: min_max
|
| 86 |
+
fps: 20
|
| 87 |
+
delta_timestamps:
|
| 88 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 89 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 90 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 91 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 92 |
+
action: '[i / 20 for i in range(16)]'
|
| 93 |
+
image_transforms:
|
| 94 |
+
enable: false
|
tcn_stackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98e6b3af802bae37423955954a602d833351925e09bbe7d44e7bacbd7da70c2c
|
| 3 |
+
size 39797427
|
tcn_stackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: TCNPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: StackCube-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: StackCube-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.images.base_camera: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.images.hand_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.state: !!python/tuple
|
| 74 |
+
- 9
|
| 75 |
+
observation.privileged: !!python/tuple
|
| 76 |
+
- 30
|
| 77 |
+
output_shapes:
|
| 78 |
+
action: !!python/tuple
|
| 79 |
+
- 16
|
| 80 |
+
- 8
|
| 81 |
+
normalization:
|
| 82 |
+
observation_modes:
|
| 83 |
+
observation.state: min_max
|
| 84 |
+
action_modes:
|
| 85 |
+
action: min_max
|
| 86 |
+
fps: 20
|
| 87 |
+
delta_timestamps:
|
| 88 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 89 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 90 |
+
observation.images.hand_camera: '[i / 20 for i in range(16)]'
|
| 91 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 92 |
+
action: '[i / 20 for i in range(16)]'
|
| 93 |
+
image_transforms:
|
| 94 |
+
enable: false
|
tcn_tworobotstackcube/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb7c9a7d875b7552477079ed88cf8f96a99d91a41414b63d8e78ec5c3b3ab2c3
|
| 3 |
+
size 38774435
|
tcn_tworobotstackcube/params/agent.yaml
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: TCNPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: TwoRobotStackCube-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: TwoRobotStackCube-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.image: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.state: !!python/tuple
|
| 70 |
+
- 18
|
| 71 |
+
observation.privileged: !!python/tuple
|
| 72 |
+
- 40
|
| 73 |
+
output_shapes:
|
| 74 |
+
action: !!python/tuple
|
| 75 |
+
- 16
|
| 76 |
+
- 16
|
| 77 |
+
normalization:
|
| 78 |
+
observation_modes:
|
| 79 |
+
observation.state: min_max
|
| 80 |
+
action_modes:
|
| 81 |
+
action: min_max
|
| 82 |
+
fps: 20
|
| 83 |
+
delta_timestamps:
|
| 84 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 85 |
+
observation.image: '[i / 20 for i in range(16)]'
|
| 86 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 87 |
+
action: '[i / 20 for i in range(16)]'
|
| 88 |
+
image_transforms:
|
| 89 |
+
enable: false
|
tcn_unitreeg1transportbox/best_model.zip
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f64c9e6df0228a0b67418c62536ba2aa6a495c39728cc20fbade9832494b9ea5
|
| 3 |
+
size 39845585
|
tcn_unitreeg1transportbox/params/agent.yaml
ADDED
|
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
seed: 42
|
| 2 |
+
device: cuda:0
|
| 3 |
+
n_epochs: 50
|
| 4 |
+
batch_size: 16
|
| 5 |
+
gradient_accumulation_steps: 1
|
| 6 |
+
mixed_precision: 'no'
|
| 7 |
+
learning_rate: 8.0e-05
|
| 8 |
+
lr_scheduler: constant
|
| 9 |
+
ent_coef: 0.01
|
| 10 |
+
l2_coef: 0.01
|
| 11 |
+
weight_decay: 0
|
| 12 |
+
max_grad_norm: 1.0
|
| 13 |
+
agent_class: sl_agent.SL
|
| 14 |
+
policy: TCNPolicy
|
| 15 |
+
policy_kwargs:
|
| 16 |
+
dim_model: 512
|
| 17 |
+
final_ffn: true
|
| 18 |
+
action_horizon: 16
|
| 19 |
+
optimizer_kwargs:
|
| 20 |
+
eps: 1.0e-08
|
| 21 |
+
noise: false
|
| 22 |
+
preprocessor_class: Lerobot_2_Army
|
| 23 |
+
preprocessor_kwargs:
|
| 24 |
+
resize_images: !!python/tuple
|
| 25 |
+
- 94
|
| 26 |
+
- 94
|
| 27 |
+
normalize_images: true
|
| 28 |
+
tokenizer_kwargs:
|
| 29 |
+
model_template: qwen2-chat
|
| 30 |
+
num_image_token: 9
|
| 31 |
+
padding_max_length: 60
|
| 32 |
+
padding_side: right
|
| 33 |
+
prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
|
| 34 |
+
observation_modes:
|
| 35 |
+
observation.state: min_max
|
| 36 |
+
action_modes:
|
| 37 |
+
action: min_max
|
| 38 |
+
overwrite_stats: false
|
| 39 |
+
stats: null
|
| 40 |
+
data_key_map:
|
| 41 |
+
observation.images.base_camera: cam1
|
| 42 |
+
observation.images.hand_camera: cam2
|
| 43 |
+
observation.images.head_camera: cam2
|
| 44 |
+
observation.images.image_side_1: cam1
|
| 45 |
+
observation.images.image_side_2: cam2
|
| 46 |
+
observation.images.image_wrist_1: cam3
|
| 47 |
+
observation.images.image_wrist_2: cam4
|
| 48 |
+
observation.top: cam1
|
| 49 |
+
image: cam1
|
| 50 |
+
wrist_image: cam2
|
| 51 |
+
observation.state: state
|
| 52 |
+
state: state
|
| 53 |
+
action: action
|
| 54 |
+
actions: action
|
| 55 |
+
task: UnitreeG1TransportBox-v1
|
| 56 |
+
env_cfg:
|
| 57 |
+
name: maniskill
|
| 58 |
+
task: UnitreeG1TransportBox-v1
|
| 59 |
+
dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
|
| 60 |
+
episodes: null
|
| 61 |
+
dataset_revision: v2.0
|
| 62 |
+
dataset_root: null
|
| 63 |
+
video_backend: pyav
|
| 64 |
+
input_shapes:
|
| 65 |
+
observation.images.base_camera: !!python/tuple
|
| 66 |
+
- 480
|
| 67 |
+
- 640
|
| 68 |
+
- 3
|
| 69 |
+
observation.images.head_camera: !!python/tuple
|
| 70 |
+
- 480
|
| 71 |
+
- 640
|
| 72 |
+
- 3
|
| 73 |
+
observation.state: !!python/tuple
|
| 74 |
+
- 25
|
| 75 |
+
observation.privileged: !!python/tuple
|
| 76 |
+
- 27
|
| 77 |
+
output_shapes:
|
| 78 |
+
action: !!python/tuple
|
| 79 |
+
- 16
|
| 80 |
+
- 25
|
| 81 |
+
normalization:
|
| 82 |
+
observation_modes:
|
| 83 |
+
observation.state: min_max
|
| 84 |
+
action_modes:
|
| 85 |
+
action: min_max
|
| 86 |
+
fps: 20
|
| 87 |
+
delta_timestamps:
|
| 88 |
+
expert_mask: '[i / 20 for i in range(16)]'
|
| 89 |
+
observation.images.base_camera: '[i / 20 for i in range(16)]'
|
| 90 |
+
observation.images.head_camera: '[i / 20 for i in range(16)]'
|
| 91 |
+
observation.state: '[i / 20 for i in range(16)]'
|
| 92 |
+
action: '[i / 20 for i in range(16)]'
|
| 93 |
+
image_transforms:
|
| 94 |
+
enable: false
|