johnMinelli commited on
Commit
d8f2c24
·
verified ·
1 Parent(s): 742f928
Files changed (48) hide show
  1. cross_peginsertionside/best_model.zip +3 -0
  2. cross_peginsertionside/params/agent.yaml +104 -0
  3. cross_stackcube/best_model.zip +3 -0
  4. cross_stackcube/params/agent.yaml +104 -0
  5. cross_tworobotstackcube/best_model.zip +3 -0
  6. cross_tworobotstackcube/params/agent.yaml +99 -0
  7. cross_unitreeg1transportbox/best_model.zip +3 -0
  8. cross_unitreeg1transportbox/params/agent.yaml +104 -0
  9. lstm_peginsertionside/best_model.zip +3 -0
  10. lstm_peginsertionside/params/agent.yaml +94 -0
  11. lstm_stackcube/best_model.zip +3 -0
  12. lstm_stackcube/params/agent.yaml +94 -0
  13. lstm_tworobotstackcube/best_model.zip +3 -0
  14. lstm_tworobotstackcube/params/agent.yaml +89 -0
  15. lstm_unitreeg1transportbox/best_model.zip +3 -0
  16. lstm_unitreeg1transportbox/params/agent.yaml +94 -0
  17. none_peginsertionside/best_model.zip +3 -0
  18. none_peginsertionside/params/agent.yaml +104 -0
  19. none_stackcube/best_model.zip +3 -0
  20. none_stackcube/params/agent.yaml +98 -0
  21. none_tworobotstackcube/best_model.zip +3 -0
  22. none_tworobotstackcube/params/agent.yaml +99 -0
  23. none_unitreeg1transportbox/best_model.zip +3 -0
  24. none_unitreeg1transportbox/params/agent.yaml +104 -0
  25. sta_peginsertionside/best_model.zip +3 -0
  26. sta_peginsertionside/params/agent.yaml +98 -0
  27. sta_peginsertionside_noisy/best_model.zip +3 -0
  28. sta_peginsertionside_noisy/params/agent.yaml +104 -0
  29. sta_stackcube/best_model.zip +3 -0
  30. sta_stackcube/params/agent.yaml +104 -0
  31. sta_stackcube_noisy/best_model.zip +3 -0
  32. sta_stackcube_noisy/params/agent.yaml +104 -0
  33. sta_tworobotstackcube/best_model.zip +3 -0
  34. sta_tworobotstackcube/params/agent.yaml +99 -0
  35. sta_tworobotstackcube_noisy/best_model.zip +3 -0
  36. sta_tworobotstackcube_noisy/params/agent.yaml +99 -0
  37. sta_unitreeg1transportbox/best_model.zip +3 -0
  38. sta_unitreeg1transportbox/params/agent.yaml +104 -0
  39. sta_unitreeg1transportbox_noisy/best_model.zip +3 -0
  40. sta_unitreeg1transportbox_noisy/params/agent.yaml +104 -0
  41. tcn_peginsertionside/best_model.zip +3 -0
  42. tcn_peginsertionside/params/agent.yaml +94 -0
  43. tcn_stackcube/best_model.zip +3 -0
  44. tcn_stackcube/params/agent.yaml +94 -0
  45. tcn_tworobotstackcube/best_model.zip +3 -0
  46. tcn_tworobotstackcube/params/agent.yaml +89 -0
  47. tcn_unitreeg1transportbox/best_model.zip +3 -0
  48. tcn_unitreeg1transportbox/params/agent.yaml +94 -0
cross_peginsertionside/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4236675d6537384de34ae6b135dbc3704e16feea0e1de27cb46723ceb0caab6a
3
+ size 93175179
cross_peginsertionside/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: PegInsertionSide-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: PegInsertionSide-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.hand_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 9
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 8
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
cross_stackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eda55ea9e1f8307ee644bd07811ecfa905b19768cf8af8da8825ea015ad98c21
3
+ size 93175118
cross_stackcube/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: StackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: StackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.hand_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 9
85
+ observation.privileged: !!python/tuple
86
+ - 30
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 8
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
cross_tworobotstackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41ca41133e0f04e72bf55945157c3adf1191e52a018134a4c8155b07d80df57e
3
+ size 93219135
cross_tworobotstackcube/params/agent.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: TwoRobotStackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: TwoRobotStackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.image: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.state: !!python/tuple
80
+ - 18
81
+ observation.privileged: !!python/tuple
82
+ - 40
83
+ output_shapes:
84
+ action: !!python/tuple
85
+ - 16
86
+ - 16
87
+ normalization:
88
+ observation_modes:
89
+ observation.state: min_max
90
+ action_modes:
91
+ action: min_max
92
+ fps: 20
93
+ delta_timestamps:
94
+ expert_mask: '[i / 20 for i in range(16)]'
95
+ observation.image: '[i / 20 for i in range(16)]'
96
+ observation.state: '[i / 20 for i in range(16)]'
97
+ action: '[i / 20 for i in range(16)]'
98
+ image_transforms:
99
+ enable: false
cross_unitreeg1transportbox/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a72cbc84bd0d33c7bb3dbb7a3858e05a7014b8b93a369c03699909f5c335a3a
3
+ size 93255978
cross_unitreeg1transportbox/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: UnitreeG1TransportBox-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: UnitreeG1TransportBox-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.head_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 25
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 25
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.head_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
lstm_peginsertionside/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:481b2a2417fd1ac3aa8691f7ba906efe587dd0fc67e9231a509b4d883d828714
3
+ size 42676885
lstm_peginsertionside/params/agent.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: LSTMPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: PegInsertionSide-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: PegInsertionSide-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.images.base_camera: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.images.hand_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.state: !!python/tuple
74
+ - 9
75
+ observation.privileged: !!python/tuple
76
+ - 27
77
+ output_shapes:
78
+ action: !!python/tuple
79
+ - 16
80
+ - 8
81
+ normalization:
82
+ observation_modes:
83
+ observation.state: min_max
84
+ action_modes:
85
+ action: min_max
86
+ fps: 20
87
+ delta_timestamps:
88
+ expert_mask: '[i / 20 for i in range(16)]'
89
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
90
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
91
+ observation.state: '[i / 20 for i in range(16)]'
92
+ action: '[i / 20 for i in range(16)]'
93
+ image_transforms:
94
+ enable: false
lstm_stackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3863c1d750feb2d79aa18c36d2d7c895f24d9e9dd48b1d6c45747f98ec459665
3
+ size 42676824
lstm_stackcube/params/agent.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: LSTMPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: StackCube-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: StackCube-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.images.base_camera: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.images.hand_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.state: !!python/tuple
74
+ - 9
75
+ observation.privileged: !!python/tuple
76
+ - 30
77
+ output_shapes:
78
+ action: !!python/tuple
79
+ - 16
80
+ - 8
81
+ normalization:
82
+ observation_modes:
83
+ observation.state: min_max
84
+ action_modes:
85
+ action: min_max
86
+ fps: 20
87
+ delta_timestamps:
88
+ expert_mask: '[i / 20 for i in range(16)]'
89
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
90
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
91
+ observation.state: '[i / 20 for i in range(16)]'
92
+ action: '[i / 20 for i in range(16)]'
93
+ image_transforms:
94
+ enable: false
lstm_tworobotstackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60c1de3094b962f8eaf3c7d9faf96e59e9eb92431850cc59d3798c9f5b4b6bfd
3
+ size 41653831
lstm_tworobotstackcube/params/agent.yaml ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: LSTMPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: TwoRobotStackCube-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: TwoRobotStackCube-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.image: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.state: !!python/tuple
70
+ - 18
71
+ observation.privileged: !!python/tuple
72
+ - 40
73
+ output_shapes:
74
+ action: !!python/tuple
75
+ - 16
76
+ - 16
77
+ normalization:
78
+ observation_modes:
79
+ observation.state: min_max
80
+ action_modes:
81
+ action: min_max
82
+ fps: 20
83
+ delta_timestamps:
84
+ expert_mask: '[i / 20 for i in range(16)]'
85
+ observation.image: '[i / 20 for i in range(16)]'
86
+ observation.state: '[i / 20 for i in range(16)]'
87
+ action: '[i / 20 for i in range(16)]'
88
+ image_transforms:
89
+ enable: false
lstm_unitreeg1transportbox/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f2f44037adaebbebfa4cfd8f3ccdf07d068616a1475763bb49bc53964af02be
3
+ size 42724986
lstm_unitreeg1transportbox/params/agent.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: LSTMPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: UnitreeG1TransportBox-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: UnitreeG1TransportBox-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.images.base_camera: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.images.head_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.state: !!python/tuple
74
+ - 25
75
+ observation.privileged: !!python/tuple
76
+ - 27
77
+ output_shapes:
78
+ action: !!python/tuple
79
+ - 16
80
+ - 25
81
+ normalization:
82
+ observation_modes:
83
+ observation.state: min_max
84
+ action_modes:
85
+ action: min_max
86
+ fps: 20
87
+ delta_timestamps:
88
+ expert_mask: '[i / 20 for i in range(16)]'
89
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
90
+ observation.images.head_camera: '[i / 20 for i in range(16)]'
91
+ observation.state: '[i / 20 for i in range(16)]'
92
+ action: '[i / 20 for i in range(16)]'
93
+ image_transforms:
94
+ enable: false
none_peginsertionside/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91f462488160c8089ccd2e7071f566291b1a24f0fba9748a749682b9797d7ffc
3
+ size 93175181
none_peginsertionside/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: false
22
+ ca_att: false
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: PegInsertionSide-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: PegInsertionSide-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.hand_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 9
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 8
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
none_stackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c991aac3d9207510a2a021c9d6c3b93c17ea6a015c3bfb393830eee59ee9d277
3
+ size 93175121
none_stackcube/params/agent.yaml ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 200
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: TransformerPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_flag: false
22
+ ca_flag: false
23
+ sta_flag: false
24
+ sta_residual: false
25
+ sta_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Agent
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ observation_modes:
39
+ observation.state: min_max
40
+ action_modes:
41
+ action: min_max
42
+ overwrite_stats: false
43
+ stats: null
44
+ data_key_map:
45
+ observation.images.base_camera: cam1
46
+ observation.images.hand_camera: cam2
47
+ observation.images.head_camera: cam2
48
+ observation.images.image_side_1: cam1
49
+ observation.images.image_side_2: cam2
50
+ observation.images.image_wrist_1: cam3
51
+ observation.images.image_wrist_2: cam4
52
+ observation.top: cam1
53
+ image: cam1
54
+ wrist_image: cam2
55
+ observation.state: state
56
+ state: state
57
+ action: action
58
+ actions: action
59
+ task: StackCube-v1
60
+ env_cfg:
61
+ name: maniskill
62
+ task: StackCube-v1
63
+ dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
64
+ episodes: null
65
+ dataset_revision: v2.0
66
+ dataset_root: null
67
+ video_backend: pyav
68
+ input_shapes:
69
+ observation.images.base_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.images.hand_camera: !!python/tuple
74
+ - 480
75
+ - 640
76
+ - 3
77
+ observation.state: !!python/tuple
78
+ - 9
79
+ observation.privileged: !!python/tuple
80
+ - 30
81
+ output_shapes:
82
+ action: !!python/tuple
83
+ - 16
84
+ - 8
85
+ normalization:
86
+ observation_modes:
87
+ observation.state: min_max
88
+ action_modes:
89
+ action: min_max
90
+ fps: 20
91
+ delta_timestamps:
92
+ expert_mask: '[i / 20 for i in range(16)]'
93
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
94
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
95
+ observation.state: '[i / 20 for i in range(16)]'
96
+ action: '[i / 20 for i in range(16)]'
97
+ image_transforms:
98
+ enable: false
none_tworobotstackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38bef25c60cb946966c5c56ea2d881437e4e2dcf3bb82aaa3da0b21e62c08c3f
3
+ size 93219134
none_tworobotstackcube/params/agent.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: false
22
+ ca_att: false
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: TwoRobotStackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: TwoRobotStackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.image: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.state: !!python/tuple
80
+ - 18
81
+ observation.privileged: !!python/tuple
82
+ - 40
83
+ output_shapes:
84
+ action: !!python/tuple
85
+ - 16
86
+ - 16
87
+ normalization:
88
+ observation_modes:
89
+ observation.state: min_max
90
+ action_modes:
91
+ action: min_max
92
+ fps: 20
93
+ delta_timestamps:
94
+ expert_mask: '[i / 20 for i in range(16)]'
95
+ observation.image: '[i / 20 for i in range(16)]'
96
+ observation.state: '[i / 20 for i in range(16)]'
97
+ action: '[i / 20 for i in range(16)]'
98
+ image_transforms:
99
+ enable: false
none_unitreeg1transportbox/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0274a2dee4c158384796bc95b982f4194839e004951a7ea39759a56c933889f5
3
+ size 93255981
none_unitreeg1transportbox/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: false
22
+ ca_att: false
23
+ army_att: false
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: UnitreeG1TransportBox-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: UnitreeG1TransportBox-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.head_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 25
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 25
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.head_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
sta_peginsertionside/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e4814f84dab65674c120a46a2fb252580538f57f43bc8323849a7fc62348c41
3
+ size 93175183
sta_peginsertionside/params/agent.yaml ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 200
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: TransformerPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_flag: true
22
+ ca_flag: true
23
+ sta_flag: true
24
+ sta_residual: false
25
+ sta_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: true
32
+ preprocessor_class: Lerobot_2_Agent
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ observation_modes:
39
+ observation.state: min_max
40
+ action_modes:
41
+ action: min_max
42
+ overwrite_stats: false
43
+ stats: null
44
+ data_key_map:
45
+ observation.images.base_camera: cam1
46
+ observation.images.hand_camera: cam2
47
+ observation.images.head_camera: cam2
48
+ observation.images.image_side_1: cam1
49
+ observation.images.image_side_2: cam2
50
+ observation.images.image_wrist_1: cam3
51
+ observation.images.image_wrist_2: cam4
52
+ observation.top: cam1
53
+ image: cam1
54
+ wrist_image: cam2
55
+ observation.state: state
56
+ state: state
57
+ action: action
58
+ actions: action
59
+ task: PegInsertionSide-v1
60
+ env_cfg:
61
+ name: maniskill
62
+ task: PegInsertionSide-v1
63
+ dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
64
+ episodes: null
65
+ dataset_revision: v2.0
66
+ dataset_root: null
67
+ video_backend: pyav
68
+ input_shapes:
69
+ observation.images.base_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.images.hand_camera: !!python/tuple
74
+ - 480
75
+ - 640
76
+ - 3
77
+ observation.state: !!python/tuple
78
+ - 9
79
+ observation.privileged: !!python/tuple
80
+ - 27
81
+ output_shapes:
82
+ action: !!python/tuple
83
+ - 16
84
+ - 8
85
+ normalization:
86
+ observation_modes:
87
+ observation.state: min_max
88
+ action_modes:
89
+ action: min_max
90
+ fps: 20
91
+ delta_timestamps:
92
+ expert_mask: '[i / 20 for i in range(16)]'
93
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
94
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
95
+ observation.state: '[i / 20 for i in range(16)]'
96
+ action: '[i / 20 for i in range(16)]'
97
+ image_transforms:
98
+ enable: false
sta_peginsertionside_noisy/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95149197c474d978c9c540c6011aa373f3ca750655d23c686527480e48a0fefc
3
+ size 93175182
sta_peginsertionside_noisy/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: true
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: PegInsertionSide-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: PegInsertionSide-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.hand_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 9
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 8
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
sta_stackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d714678729d554c791038f8a62d6099edfdedcebec87417f3abf67820b69eeb0
3
+ size 93175117
sta_stackcube/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: StackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: StackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.hand_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 9
85
+ observation.privileged: !!python/tuple
86
+ - 30
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 8
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
sta_stackcube_noisy/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef31875454bfd56a639d112ee74b16f7336ae05e5e5c70c0cfa1abf25b3dd3f0
3
+ size 93175116
sta_stackcube_noisy/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: true
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: StackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: StackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.hand_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 9
85
+ observation.privileged: !!python/tuple
86
+ - 30
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 8
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
sta_tworobotstackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da45ef75d11ce0f92c8a193a6662a5d5cd1aa139f07a89f89fe92a1e46fd977c
3
+ size 93219132
sta_tworobotstackcube/params/agent.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: TwoRobotStackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: TwoRobotStackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.image: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.state: !!python/tuple
80
+ - 18
81
+ observation.privileged: !!python/tuple
82
+ - 40
83
+ output_shapes:
84
+ action: !!python/tuple
85
+ - 16
86
+ - 16
87
+ normalization:
88
+ observation_modes:
89
+ observation.state: min_max
90
+ action_modes:
91
+ action: min_max
92
+ fps: 20
93
+ delta_timestamps:
94
+ expert_mask: '[i / 20 for i in range(16)]'
95
+ observation.image: '[i / 20 for i in range(16)]'
96
+ observation.state: '[i / 20 for i in range(16)]'
97
+ action: '[i / 20 for i in range(16)]'
98
+ image_transforms:
99
+ enable: false
sta_tworobotstackcube_noisy/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74b77a37d4f2c2ddeb23580ae48e1e89788c86e082666010733917800b5406ec
3
+ size 93219131
sta_tworobotstackcube_noisy/params/agent.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: true
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: TwoRobotStackCube-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: TwoRobotStackCube-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.image: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.state: !!python/tuple
80
+ - 18
81
+ observation.privileged: !!python/tuple
82
+ - 40
83
+ output_shapes:
84
+ action: !!python/tuple
85
+ - 16
86
+ - 16
87
+ normalization:
88
+ observation_modes:
89
+ observation.state: min_max
90
+ action_modes:
91
+ action: min_max
92
+ fps: 20
93
+ delta_timestamps:
94
+ expert_mask: '[i / 20 for i in range(16)]'
95
+ observation.image: '[i / 20 for i in range(16)]'
96
+ observation.state: '[i / 20 for i in range(16)]'
97
+ action: '[i / 20 for i in range(16)]'
98
+ image_transforms:
99
+ enable: false
sta_unitreeg1transportbox/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba139bc6eef6088de70c5d67f1e97da247865c75db47bff8f76448b5b8cd8c76
3
+ size 93255978
sta_unitreeg1transportbox/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: false
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: UnitreeG1TransportBox-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: UnitreeG1TransportBox-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.head_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 25
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 25
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.head_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
sta_unitreeg1transportbox_noisy/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:275345602402e5826857b67fd9f5d1a43f66841a28b683c3bcf3bada3ebb01be
3
+ size 93255977
sta_unitreeg1transportbox_noisy/params/agent.yaml ADDED
@@ -0,0 +1,104 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 50
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: ARMYPolicy
15
+ policy_kwargs:
16
+ dim_decoder: 512
17
+ n_decoder_layers: 4
18
+ n_decoder_heads: 8
19
+ use_rmsnorm: true
20
+ pre_norm: true
21
+ sa_att: true
22
+ ca_att: true
23
+ army_att: true
24
+ army_residual: false
25
+ army_norm: math
26
+ dropout: 0.0
27
+ dropout_residual: 0.0
28
+ action_horizon: 16
29
+ optimizer_kwargs:
30
+ eps: 1.0e-08
31
+ noise: true
32
+ preprocessor_class: Lerobot_2_Army
33
+ preprocessor_kwargs:
34
+ resize_images: !!python/tuple
35
+ - 94
36
+ - 94
37
+ normalize_images: true
38
+ tokenizer_kwargs:
39
+ model_template: qwen2-chat
40
+ num_image_token: 9
41
+ padding_max_length: 60
42
+ padding_side: right
43
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
44
+ observation_modes:
45
+ observation.state: min_max
46
+ action_modes:
47
+ action: min_max
48
+ overwrite_stats: false
49
+ stats: null
50
+ data_key_map:
51
+ observation.images.base_camera: cam1
52
+ observation.images.hand_camera: cam2
53
+ observation.images.head_camera: cam2
54
+ observation.images.image_side_1: cam1
55
+ observation.images.image_side_2: cam2
56
+ observation.images.image_wrist_1: cam3
57
+ observation.images.image_wrist_2: cam4
58
+ observation.top: cam1
59
+ image: cam1
60
+ wrist_image: cam2
61
+ observation.state: state
62
+ state: state
63
+ action: action
64
+ actions: action
65
+ task: UnitreeG1TransportBox-v1
66
+ env_cfg:
67
+ name: maniskill
68
+ task: UnitreeG1TransportBox-v1
69
+ dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
70
+ episodes: null
71
+ dataset_revision: v2.0
72
+ dataset_root: null
73
+ video_backend: pyav
74
+ input_shapes:
75
+ observation.images.base_camera: !!python/tuple
76
+ - 480
77
+ - 640
78
+ - 3
79
+ observation.images.head_camera: !!python/tuple
80
+ - 480
81
+ - 640
82
+ - 3
83
+ observation.state: !!python/tuple
84
+ - 25
85
+ observation.privileged: !!python/tuple
86
+ - 27
87
+ output_shapes:
88
+ action: !!python/tuple
89
+ - 16
90
+ - 25
91
+ normalization:
92
+ observation_modes:
93
+ observation.state: min_max
94
+ action_modes:
95
+ action: min_max
96
+ fps: 20
97
+ delta_timestamps:
98
+ expert_mask: '[i / 20 for i in range(16)]'
99
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
100
+ observation.images.head_camera: '[i / 20 for i in range(16)]'
101
+ observation.state: '[i / 20 for i in range(16)]'
102
+ action: '[i / 20 for i in range(16)]'
103
+ image_transforms:
104
+ enable: false
tcn_peginsertionside/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed19d3a5e08c7de93c8525848d6be466c083504400fa90e115ebc4280152ab56
3
+ size 39797489
tcn_peginsertionside/params/agent.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: TCNPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: PegInsertionSide-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: PegInsertionSide-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_PegInsertionSide-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.images.base_camera: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.images.hand_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.state: !!python/tuple
74
+ - 9
75
+ observation.privileged: !!python/tuple
76
+ - 27
77
+ output_shapes:
78
+ action: !!python/tuple
79
+ - 16
80
+ - 8
81
+ normalization:
82
+ observation_modes:
83
+ observation.state: min_max
84
+ action_modes:
85
+ action: min_max
86
+ fps: 20
87
+ delta_timestamps:
88
+ expert_mask: '[i / 20 for i in range(16)]'
89
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
90
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
91
+ observation.state: '[i / 20 for i in range(16)]'
92
+ action: '[i / 20 for i in range(16)]'
93
+ image_transforms:
94
+ enable: false
tcn_stackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98e6b3af802bae37423955954a602d833351925e09bbe7d44e7bacbd7da70c2c
3
+ size 39797427
tcn_stackcube/params/agent.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: TCNPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: StackCube-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: StackCube-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_StackCube-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.images.base_camera: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.images.hand_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.state: !!python/tuple
74
+ - 9
75
+ observation.privileged: !!python/tuple
76
+ - 30
77
+ output_shapes:
78
+ action: !!python/tuple
79
+ - 16
80
+ - 8
81
+ normalization:
82
+ observation_modes:
83
+ observation.state: min_max
84
+ action_modes:
85
+ action: min_max
86
+ fps: 20
87
+ delta_timestamps:
88
+ expert_mask: '[i / 20 for i in range(16)]'
89
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
90
+ observation.images.hand_camera: '[i / 20 for i in range(16)]'
91
+ observation.state: '[i / 20 for i in range(16)]'
92
+ action: '[i / 20 for i in range(16)]'
93
+ image_transforms:
94
+ enable: false
tcn_tworobotstackcube/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb7c9a7d875b7552477079ed88cf8f96a99d91a41414b63d8e78ec5c3b3ab2c3
3
+ size 38774435
tcn_tworobotstackcube/params/agent.yaml ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: TCNPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: TwoRobotStackCube-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: TwoRobotStackCube-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_TwoRobotStackCube-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.image: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.state: !!python/tuple
70
+ - 18
71
+ observation.privileged: !!python/tuple
72
+ - 40
73
+ output_shapes:
74
+ action: !!python/tuple
75
+ - 16
76
+ - 16
77
+ normalization:
78
+ observation_modes:
79
+ observation.state: min_max
80
+ action_modes:
81
+ action: min_max
82
+ fps: 20
83
+ delta_timestamps:
84
+ expert_mask: '[i / 20 for i in range(16)]'
85
+ observation.image: '[i / 20 for i in range(16)]'
86
+ observation.state: '[i / 20 for i in range(16)]'
87
+ action: '[i / 20 for i in range(16)]'
88
+ image_transforms:
89
+ enable: false
tcn_unitreeg1transportbox/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f64c9e6df0228a0b67418c62536ba2aa6a495c39728cc20fbade9832494b9ea5
3
+ size 39845585
tcn_unitreeg1transportbox/params/agent.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 42
2
+ device: cuda:0
3
+ n_epochs: 50
4
+ batch_size: 16
5
+ gradient_accumulation_steps: 1
6
+ mixed_precision: 'no'
7
+ learning_rate: 8.0e-05
8
+ lr_scheduler: constant
9
+ ent_coef: 0.01
10
+ l2_coef: 0.01
11
+ weight_decay: 0
12
+ max_grad_norm: 1.0
13
+ agent_class: sl_agent.SL
14
+ policy: TCNPolicy
15
+ policy_kwargs:
16
+ dim_model: 512
17
+ final_ffn: true
18
+ action_horizon: 16
19
+ optimizer_kwargs:
20
+ eps: 1.0e-08
21
+ noise: false
22
+ preprocessor_class: Lerobot_2_Army
23
+ preprocessor_kwargs:
24
+ resize_images: !!python/tuple
25
+ - 94
26
+ - 94
27
+ normalize_images: true
28
+ tokenizer_kwargs:
29
+ model_template: qwen2-chat
30
+ num_image_token: 9
31
+ padding_max_length: 60
32
+ padding_side: right
33
+ prompt_generator: FixedPromptGenerator("Insert the peg into the hole.")
34
+ observation_modes:
35
+ observation.state: min_max
36
+ action_modes:
37
+ action: min_max
38
+ overwrite_stats: false
39
+ stats: null
40
+ data_key_map:
41
+ observation.images.base_camera: cam1
42
+ observation.images.hand_camera: cam2
43
+ observation.images.head_camera: cam2
44
+ observation.images.image_side_1: cam1
45
+ observation.images.image_side_2: cam2
46
+ observation.images.image_wrist_1: cam3
47
+ observation.images.image_wrist_2: cam4
48
+ observation.top: cam1
49
+ image: cam1
50
+ wrist_image: cam2
51
+ observation.state: state
52
+ state: state
53
+ action: action
54
+ actions: action
55
+ task: UnitreeG1TransportBox-v1
56
+ env_cfg:
57
+ name: maniskill
58
+ task: UnitreeG1TransportBox-v1
59
+ dataset_repo_id: johnMinelli/ManiSkill_UnitreeG1TransportBox-v1_recovery
60
+ episodes: null
61
+ dataset_revision: v2.0
62
+ dataset_root: null
63
+ video_backend: pyav
64
+ input_shapes:
65
+ observation.images.base_camera: !!python/tuple
66
+ - 480
67
+ - 640
68
+ - 3
69
+ observation.images.head_camera: !!python/tuple
70
+ - 480
71
+ - 640
72
+ - 3
73
+ observation.state: !!python/tuple
74
+ - 25
75
+ observation.privileged: !!python/tuple
76
+ - 27
77
+ output_shapes:
78
+ action: !!python/tuple
79
+ - 16
80
+ - 25
81
+ normalization:
82
+ observation_modes:
83
+ observation.state: min_max
84
+ action_modes:
85
+ action: min_max
86
+ fps: 20
87
+ delta_timestamps:
88
+ expert_mask: '[i / 20 for i in range(16)]'
89
+ observation.images.base_camera: '[i / 20 for i in range(16)]'
90
+ observation.images.head_camera: '[i / 20 for i in range(16)]'
91
+ observation.state: '[i / 20 for i in range(16)]'
92
+ action: '[i / 20 for i in range(16)]'
93
+ image_transforms:
94
+ enable: false