shuohsuan commited on
Commit
e03e4a1
·
verified ·
1 Parent(s): ad62281

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +162 -0
  2. config.json +69 -0
  3. model.safetensors +3 -0
  4. train_config.json +277 -0
README.md ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ datasets:
3
+ - shuohsuan/grasp_data_000_009
4
+ - shuohsuan/grasp_data_010_019
5
+ - shuohsuan/grasp_data_020_029
6
+ - shuohsuan/grasp_data_030_039
7
+ - shuohsuan/grasp_data_040_049
8
+ - shuohsuan/grasp_data_050_059
9
+ - shuohsuan/grasp_data_060_069
10
+ - shuohsuan/grasp_data_070_079
11
+ - shuohsuan/grasp_data_080_089
12
+ - shuohsuan/grasp_data_090_099
13
+ - shuohsuan/grasp_data_100_109
14
+ - shuohsuan/grasp_data_110_119
15
+ - shuohsuan/grasp_data_120_129
16
+ - shuohsuan/grasp_data_130_139
17
+ - shuohsuan/grasp_data_140_149
18
+ - shuohsuan/grasp_data_150_159
19
+ - shuohsuan/grasp_data_160_169
20
+ - shuohsuan/grasp_data_170_179
21
+ - shuohsuan/grasp_data_180_189
22
+ - shuohsuan/grasp_data_190_199
23
+ - shuohsuan/grasp_data_200_209
24
+ - shuohsuan/grasp_data_210_219
25
+ - shuohsuan/grasp_data_220_229
26
+ - shuohsuan/grasp_data_230_239
27
+ - shuohsuan/grasp_data_240_249
28
+ - shuohsuan/grasp_data_250_259
29
+ - shuohsuan/grasp_data_260_269
30
+ - shuohsuan/grasp_data_270_279
31
+ - shuohsuan/grasp_data_280_289
32
+ - shuohsuan/grasp_data_290_299
33
+ - shuohsuan/grasp_data_300_309
34
+ - shuohsuan/grasp_data_310_319
35
+ - shuohsuan/grasp_data_320_329
36
+ - shuohsuan/grasp_data_330_339
37
+ - shuohsuan/grasp_data_340_349
38
+ - shuohsuan/grasp_data_350_359
39
+ - shuohsuan/grasp_data_360_369
40
+ - shuohsuan/grasp_data_370_379
41
+ - shuohsuan/grasp_data_380_389
42
+ - shuohsuan/grasp_data_390_399
43
+ - shuohsuan/grasp_data_400_409
44
+ - shuohsuan/grasp_data_410_419
45
+ - shuohsuan/grasp_data_420_429
46
+ - shuohsuan/grasp_data_430_439
47
+ - shuohsuan/grasp_data_440_449
48
+ - shuohsuan/grasp_data_450_459
49
+ - shuohsuan/grasp_data_460_469
50
+ - shuohsuan/grasp_data_470_479
51
+ - shuohsuan/grasp_data_480_489
52
+ - shuohsuan/grasp_data_490_499
53
+ - shuohsuan/grasp_data_500_509
54
+ - shuohsuan/grasp_data_510_519
55
+ - shuohsuan/grasp_data_520_529
56
+ - shuohsuan/grasp_data_530_539
57
+ - shuohsuan/grasp_data_540_549
58
+ - shuohsuan/grasp_data_550_559
59
+ - shuohsuan/grasp_data_560_569
60
+ - shuohsuan/grasp_data_570_579
61
+ - shuohsuan/grasp_data_580_589
62
+ - shuohsuan/grasp_data_590_599
63
+ - shuohsuan/grasp_data_600_609
64
+ - shuohsuan/grasp_data_610_619
65
+ - shuohsuan/grasp_data_620_629
66
+ - shuohsuan/grasp_data_630_639
67
+ - shuohsuan/grasp_data_640_649
68
+ - shuohsuan/grasp_data_650_659
69
+ - shuohsuan/grasp_data_660_669
70
+ - shuohsuan/grasp_data_670_679
71
+ - shuohsuan/grasp_data_680_689
72
+ - shuohsuan/grasp_data_690_699
73
+ - shuohsuan/grasp_data_700_709
74
+ - shuohsuan/grasp_data_710_719
75
+ - shuohsuan/grasp_data_720_729
76
+ - shuohsuan/grasp_data_730_739
77
+ - shuohsuan/grasp_data_740_749
78
+ - shuohsuan/grasp_data_750_759
79
+ - shuohsuan/grasp_data_760_769
80
+ - shuohsuan/grasp_data_770_779
81
+ - shuohsuan/grasp_data_780_789
82
+ - shuohsuan/grasp_data_790_799
83
+ - shuohsuan/grasp_data_800_809
84
+ - shuohsuan/grasp_data_810_819
85
+ - shuohsuan/grasp_data_820_829
86
+ - shuohsuan/grasp_data_830_839
87
+ - shuohsuan/grasp_data_840_849
88
+ - shuohsuan/grasp_data_850_859
89
+ - shuohsuan/grasp_data_860_869
90
+ - shuohsuan/grasp_data_870_879
91
+ - shuohsuan/grasp_data_880_889
92
+ - shuohsuan/grasp_data_890_899
93
+ - shuohsuan/grasp_data_900_909
94
+ - shuohsuan/grasp_data_910_919
95
+ - shuohsuan/grasp_data_920_929
96
+ - shuohsuan/grasp_data_930_939
97
+ - shuohsuan/grasp_data_940_949
98
+ - shuohsuan/grasp_data_950_959
99
+ - shuohsuan/grasp_data_960_969
100
+ - shuohsuan/grasp_data_970_979
101
+ - shuohsuan/grasp_data_980_989
102
+ - shuohsuan/grasp_data_990_999
103
+ library_name: lerobot
104
+ license: apache-2.0
105
+ model_name: act
106
+ pipeline_tag: robotics
107
+ tags:
108
+ - lerobot
109
+ - robotics
110
+ - act
111
+ ---
112
+
113
+ # Model Card for act
114
+
115
+ <!-- Provide a quick summary of what the model is/does. -->
116
+
117
+
118
+ [Action Chunking with Transformers (ACT)](https://huggingface.co/papers/2304.13705) is an imitation-learning method that predicts short action chunks instead of single steps. It learns from teleoperated data and often achieves high success rates.
119
+
120
+
121
+ This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
122
+ See the full documentation at [LeRobot Docs](https://huggingface.co/docs/lerobot/index).
123
+
124
+ ---
125
+
126
+ ## How to Get Started with the Model
127
+
128
+ For a complete walkthrough, see the [training guide](https://huggingface.co/docs/lerobot/il_robots#train-a-policy).
129
+ Below is the short version on how to train and run inference/eval:
130
+
131
+ ### Train from scratch
132
+
133
+ ```bash
134
+ python -m lerobot.scripts.train \
135
+ --dataset.repo_id=${HF_USER}/<dataset> \
136
+ --policy.type=act \
137
+ --output_dir=outputs/train/<desired_policy_repo_id> \
138
+ --job_name=lerobot_training \
139
+ --policy.device=cuda \
140
+ --policy.repo_id=${HF_USER}/<desired_policy_repo_id>
141
+ --wandb.enable=true
142
+ ```
143
+
144
+ *Writes checkpoints to `outputs/train/<desired_policy_repo_id>/checkpoints/`.*
145
+
146
+ ### Evaluate the policy/run inference
147
+
148
+ ```bash
149
+ python -m lerobot.record \
150
+ --robot.type=so100_follower \
151
+ --dataset.repo_id=<hf_user>/eval_<dataset> \
152
+ --policy.path=<hf_user>/<desired_policy_repo_id> \
153
+ --episodes=10
154
+ ```
155
+
156
+ Prefix the dataset repo with **eval\_** and supply `--policy.path` pointing to a local or hub checkpoint.
157
+
158
+ ---
159
+
160
+ ## Model Details
161
+
162
+ * **License:** apache-2.0
config.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "type": "act",
3
+ "n_obs_steps": 1,
4
+ "normalization_mapping": {
5
+ "VISUAL": "MEAN_STD",
6
+ "STATE": "MEAN_STD",
7
+ "ACTION": "MEAN_STD"
8
+ },
9
+ "input_features": {
10
+ "observation.state": {
11
+ "type": "STATE",
12
+ "shape": [
13
+ 6
14
+ ]
15
+ },
16
+ "observation.images.top": {
17
+ "type": "VISUAL",
18
+ "shape": [
19
+ 3,
20
+ 480,
21
+ 640
22
+ ]
23
+ },
24
+ "observation.images.wrist": {
25
+ "type": "VISUAL",
26
+ "shape": [
27
+ 3,
28
+ 480,
29
+ 640
30
+ ]
31
+ }
32
+ },
33
+ "output_features": {
34
+ "action": {
35
+ "type": "ACTION",
36
+ "shape": [
37
+ 6
38
+ ]
39
+ }
40
+ },
41
+ "device": "cuda",
42
+ "use_amp": false,
43
+ "push_to_hub": true,
44
+ "repo_id": "shuohsuan/act_multi_grasp_rand",
45
+ "private": null,
46
+ "tags": null,
47
+ "license": null,
48
+ "chunk_size": 100,
49
+ "n_action_steps": 100,
50
+ "vision_backbone": "resnet18",
51
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
52
+ "replace_final_stride_with_dilation": false,
53
+ "pre_norm": false,
54
+ "dim_model": 512,
55
+ "n_heads": 8,
56
+ "dim_feedforward": 3200,
57
+ "feedforward_activation": "relu",
58
+ "n_encoder_layers": 4,
59
+ "n_decoder_layers": 1,
60
+ "use_vae": true,
61
+ "latent_dim": 32,
62
+ "n_vae_encoder_layers": 4,
63
+ "temporal_ensemble_coeff": null,
64
+ "dropout": 0.1,
65
+ "kl_weight": 10.0,
66
+ "optimizer_lr": 1e-05,
67
+ "optimizer_weight_decay": 0.0001,
68
+ "optimizer_lr_backbone": 1e-05
69
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fa97ba678fe606641633882db95d104b68fcdd59d73caa0a1b07f887b98621d
3
+ size 206701064
train_config.json ADDED
@@ -0,0 +1,277 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": {
3
+ "repo_id": [
4
+ "shuohsuan/grasp_data_000_009",
5
+ "shuohsuan/grasp_data_010_019",
6
+ "shuohsuan/grasp_data_020_029",
7
+ "shuohsuan/grasp_data_030_039",
8
+ "shuohsuan/grasp_data_040_049",
9
+ "shuohsuan/grasp_data_050_059",
10
+ "shuohsuan/grasp_data_060_069",
11
+ "shuohsuan/grasp_data_070_079",
12
+ "shuohsuan/grasp_data_080_089",
13
+ "shuohsuan/grasp_data_090_099",
14
+ "shuohsuan/grasp_data_100_109",
15
+ "shuohsuan/grasp_data_110_119",
16
+ "shuohsuan/grasp_data_120_129",
17
+ "shuohsuan/grasp_data_130_139",
18
+ "shuohsuan/grasp_data_140_149",
19
+ "shuohsuan/grasp_data_150_159",
20
+ "shuohsuan/grasp_data_160_169",
21
+ "shuohsuan/grasp_data_170_179",
22
+ "shuohsuan/grasp_data_180_189",
23
+ "shuohsuan/grasp_data_190_199",
24
+ "shuohsuan/grasp_data_200_209",
25
+ "shuohsuan/grasp_data_210_219",
26
+ "shuohsuan/grasp_data_220_229",
27
+ "shuohsuan/grasp_data_230_239",
28
+ "shuohsuan/grasp_data_240_249",
29
+ "shuohsuan/grasp_data_250_259",
30
+ "shuohsuan/grasp_data_260_269",
31
+ "shuohsuan/grasp_data_270_279",
32
+ "shuohsuan/grasp_data_280_289",
33
+ "shuohsuan/grasp_data_290_299",
34
+ "shuohsuan/grasp_data_300_309",
35
+ "shuohsuan/grasp_data_310_319",
36
+ "shuohsuan/grasp_data_320_329",
37
+ "shuohsuan/grasp_data_330_339",
38
+ "shuohsuan/grasp_data_340_349",
39
+ "shuohsuan/grasp_data_350_359",
40
+ "shuohsuan/grasp_data_360_369",
41
+ "shuohsuan/grasp_data_370_379",
42
+ "shuohsuan/grasp_data_380_389",
43
+ "shuohsuan/grasp_data_390_399",
44
+ "shuohsuan/grasp_data_400_409",
45
+ "shuohsuan/grasp_data_410_419",
46
+ "shuohsuan/grasp_data_420_429",
47
+ "shuohsuan/grasp_data_430_439",
48
+ "shuohsuan/grasp_data_440_449",
49
+ "shuohsuan/grasp_data_450_459",
50
+ "shuohsuan/grasp_data_460_469",
51
+ "shuohsuan/grasp_data_470_479",
52
+ "shuohsuan/grasp_data_480_489",
53
+ "shuohsuan/grasp_data_490_499",
54
+ "shuohsuan/grasp_data_500_509",
55
+ "shuohsuan/grasp_data_510_519",
56
+ "shuohsuan/grasp_data_520_529",
57
+ "shuohsuan/grasp_data_530_539",
58
+ "shuohsuan/grasp_data_540_549",
59
+ "shuohsuan/grasp_data_550_559",
60
+ "shuohsuan/grasp_data_560_569",
61
+ "shuohsuan/grasp_data_570_579",
62
+ "shuohsuan/grasp_data_580_589",
63
+ "shuohsuan/grasp_data_590_599",
64
+ "shuohsuan/grasp_data_600_609",
65
+ "shuohsuan/grasp_data_610_619",
66
+ "shuohsuan/grasp_data_620_629",
67
+ "shuohsuan/grasp_data_630_639",
68
+ "shuohsuan/grasp_data_640_649",
69
+ "shuohsuan/grasp_data_650_659",
70
+ "shuohsuan/grasp_data_660_669",
71
+ "shuohsuan/grasp_data_670_679",
72
+ "shuohsuan/grasp_data_680_689",
73
+ "shuohsuan/grasp_data_690_699",
74
+ "shuohsuan/grasp_data_700_709",
75
+ "shuohsuan/grasp_data_710_719",
76
+ "shuohsuan/grasp_data_720_729",
77
+ "shuohsuan/grasp_data_730_739",
78
+ "shuohsuan/grasp_data_740_749",
79
+ "shuohsuan/grasp_data_750_759",
80
+ "shuohsuan/grasp_data_760_769",
81
+ "shuohsuan/grasp_data_770_779",
82
+ "shuohsuan/grasp_data_780_789",
83
+ "shuohsuan/grasp_data_790_799",
84
+ "shuohsuan/grasp_data_800_809",
85
+ "shuohsuan/grasp_data_810_819",
86
+ "shuohsuan/grasp_data_820_829",
87
+ "shuohsuan/grasp_data_830_839",
88
+ "shuohsuan/grasp_data_840_849",
89
+ "shuohsuan/grasp_data_850_859",
90
+ "shuohsuan/grasp_data_860_869",
91
+ "shuohsuan/grasp_data_870_879",
92
+ "shuohsuan/grasp_data_880_889",
93
+ "shuohsuan/grasp_data_890_899",
94
+ "shuohsuan/grasp_data_900_909",
95
+ "shuohsuan/grasp_data_910_919",
96
+ "shuohsuan/grasp_data_920_929",
97
+ "shuohsuan/grasp_data_930_939",
98
+ "shuohsuan/grasp_data_940_949",
99
+ "shuohsuan/grasp_data_950_959",
100
+ "shuohsuan/grasp_data_960_969",
101
+ "shuohsuan/grasp_data_970_979",
102
+ "shuohsuan/grasp_data_980_989",
103
+ "shuohsuan/grasp_data_990_999"
104
+ ],
105
+ "repo_idx": 100,
106
+ "root": null,
107
+ "episodes": null,
108
+ "image_transforms": {
109
+ "enable": false,
110
+ "max_num_transforms": 3,
111
+ "random_order": false,
112
+ "tfs": {
113
+ "brightness": {
114
+ "weight": 1.0,
115
+ "type": "ColorJitter",
116
+ "kwargs": {
117
+ "brightness": [
118
+ 0.8,
119
+ 1.2
120
+ ]
121
+ }
122
+ },
123
+ "contrast": {
124
+ "weight": 1.0,
125
+ "type": "ColorJitter",
126
+ "kwargs": {
127
+ "contrast": [
128
+ 0.8,
129
+ 1.2
130
+ ]
131
+ }
132
+ },
133
+ "saturation": {
134
+ "weight": 1.0,
135
+ "type": "ColorJitter",
136
+ "kwargs": {
137
+ "saturation": [
138
+ 0.5,
139
+ 1.5
140
+ ]
141
+ }
142
+ },
143
+ "hue": {
144
+ "weight": 1.0,
145
+ "type": "ColorJitter",
146
+ "kwargs": {
147
+ "hue": [
148
+ -0.05,
149
+ 0.05
150
+ ]
151
+ }
152
+ },
153
+ "sharpness": {
154
+ "weight": 1.0,
155
+ "type": "SharpnessJitter",
156
+ "kwargs": {
157
+ "sharpness": [
158
+ 0.5,
159
+ 1.5
160
+ ]
161
+ }
162
+ }
163
+ }
164
+ },
165
+ "revision": null,
166
+ "use_imagenet_stats": true,
167
+ "video_backend": "torchcodec"
168
+ },
169
+ "env": null,
170
+ "policy": {
171
+ "type": "act",
172
+ "n_obs_steps": 1,
173
+ "normalization_mapping": {
174
+ "VISUAL": "MEAN_STD",
175
+ "STATE": "MEAN_STD",
176
+ "ACTION": "MEAN_STD"
177
+ },
178
+ "input_features": {
179
+ "observation.state": {
180
+ "type": "STATE",
181
+ "shape": [
182
+ 6
183
+ ]
184
+ },
185
+ "observation.images.top": {
186
+ "type": "VISUAL",
187
+ "shape": [
188
+ 3,
189
+ 480,
190
+ 640
191
+ ]
192
+ },
193
+ "observation.images.wrist": {
194
+ "type": "VISUAL",
195
+ "shape": [
196
+ 3,
197
+ 480,
198
+ 640
199
+ ]
200
+ }
201
+ },
202
+ "output_features": {
203
+ "action": {
204
+ "type": "ACTION",
205
+ "shape": [
206
+ 6
207
+ ]
208
+ }
209
+ },
210
+ "device": "cuda",
211
+ "use_amp": false,
212
+ "push_to_hub": true,
213
+ "repo_id": "shuohsuan/act_multi_grasp_rand",
214
+ "private": null,
215
+ "tags": null,
216
+ "license": null,
217
+ "chunk_size": 100,
218
+ "n_action_steps": 100,
219
+ "vision_backbone": "resnet18",
220
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
221
+ "replace_final_stride_with_dilation": false,
222
+ "pre_norm": false,
223
+ "dim_model": 512,
224
+ "n_heads": 8,
225
+ "dim_feedforward": 3200,
226
+ "feedforward_activation": "relu",
227
+ "n_encoder_layers": 4,
228
+ "n_decoder_layers": 1,
229
+ "use_vae": true,
230
+ "latent_dim": 32,
231
+ "n_vae_encoder_layers": 4,
232
+ "temporal_ensemble_coeff": null,
233
+ "dropout": 0.1,
234
+ "kl_weight": 10.0,
235
+ "optimizer_lr": 1e-05,
236
+ "optimizer_weight_decay": 0.0001,
237
+ "optimizer_lr_backbone": 1e-05
238
+ },
239
+ "output_dir": "/mnt/storage/shuohsuan/train/act_multi_grasp_rand",
240
+ "job_name": "act_grasp_rand",
241
+ "resume": false,
242
+ "seed": 1000,
243
+ "num_workers": 4,
244
+ "batch_size": 64,
245
+ "steps": 200000,
246
+ "eval_freq": 20000,
247
+ "log_freq": 200,
248
+ "save_checkpoint": true,
249
+ "save_freq": 20000,
250
+ "use_policy_training_preset": true,
251
+ "optimizer": {
252
+ "type": "adamw",
253
+ "lr": 1e-05,
254
+ "weight_decay": 0.0001,
255
+ "grad_clip_norm": 10.0,
256
+ "betas": [
257
+ 0.9,
258
+ 0.999
259
+ ],
260
+ "eps": 1e-08
261
+ },
262
+ "scheduler": null,
263
+ "eval": {
264
+ "n_episodes": 50,
265
+ "batch_size": 50,
266
+ "use_async_envs": false
267
+ },
268
+ "wandb": {
269
+ "enable": false,
270
+ "disable_artifact": false,
271
+ "project": "lerobot",
272
+ "entity": null,
273
+ "notes": null,
274
+ "run_id": null,
275
+ "mode": null
276
+ }
277
+ }