Timsty commited on
Commit
8ec58e6
·
verified ·
1 Parent(s): 7212da6

Upload folder using huggingface_hub

Browse files
0424_QwenPI_13tasks_actionstate_50k/config.json ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "run_id": "0424_QwenPI_13tasks_actionstate_50k",
3
+ "run_root_dir": "./runs",
4
+ "seed": 42,
5
+ "trackers": [
6
+ "jsonl",
7
+ "wandb"
8
+ ],
9
+ "wandb_entity": "timsty",
10
+ "wandb_project": "vla_jepa",
11
+ "is_debug": false,
12
+ "framework": {
13
+ "name": "QwenPI",
14
+ "qwenvl": {
15
+ "base_vlm": "/mnt/data/fangyu/model/Qwen/Qwen3-VL-2B-Instruct",
16
+ "attn_implementation": "flash_attention_2",
17
+ "vl_hidden_dim": 2048,
18
+ "num_data_tokens": 32
19
+ },
20
+ "action_model": {
21
+ "dataset_vocab_size": 256,
22
+ "hidden_size": 1024,
23
+ "add_pos_embed": true,
24
+ "max_seq_len": 1024,
25
+ "action_dim": 37,
26
+ "state_dim": 74,
27
+ "future_action_window_size": 14,
28
+ "action_horizon": 15,
29
+ "past_action_window_size": 0,
30
+ "noise_beta_alpha": 1.5,
31
+ "noise_beta_beta": 1.0,
32
+ "noise_s": 0.999,
33
+ "num_timestep_buckets": 1000,
34
+ "num_inference_timesteps": 10,
35
+ "num_target_vision_tokens": 32,
36
+ "diffusion_model_cfg": {
37
+ "dropout": 0.2,
38
+ "final_dropout": true,
39
+ "interleave_self_attention": true,
40
+ "norm_type": "ada_norm",
41
+ "output_dim": 1024,
42
+ "positional_embeddings": null
43
+ }
44
+ }
45
+ },
46
+ "datasets": {
47
+ "vla_data": {
48
+ "dataset_py": "lerobot_datasets",
49
+ "data_root_dir": "/mnt/data/fangyu/dataset/IPEC-COMMUNITY",
50
+ "data_mix": "cross_embodiedment_13tasks",
51
+ "CoT_prompt": "Task: {instruction}. What are the next 15 actions to take?",
52
+ "default_image_resolution": [
53
+ 3,
54
+ 224,
55
+ 224
56
+ ],
57
+ "per_device_batch_size": 64,
58
+ "load_all_data_for_training": true,
59
+ "obs": [
60
+ "image_0"
61
+ ],
62
+ "image_size": [
63
+ 224,
64
+ 224
65
+ ],
66
+ "video_backend": "torchcodec",
67
+ "load_video": true,
68
+ "chunk_size": 15,
69
+ "state_use_action_chunk": false,
70
+ "num_history_steps": 0,
71
+ "include_state": true
72
+ }
73
+ },
74
+ "trainer": {
75
+ "epochs": 100,
76
+ "max_train_steps": 50000,
77
+ "num_warmup_steps": 5000,
78
+ "num_stable_steps": 0,
79
+ "save_interval": 5000,
80
+ "eval_interval": 50,
81
+ "max_checkpoints_to_keep": 20,
82
+ "repeated_diffusion_steps": 1,
83
+ "learning_rate": {
84
+ "base": 5e-05,
85
+ "qwen_vl_interface": 5e-05,
86
+ "action_model": 5e-05
87
+ },
88
+ "lr_scheduler_type": "warmup_stable_cosine",
89
+ "scheduler_specific_kwargs": {
90
+ "min_lr_ratio": 0.001
91
+ },
92
+ "freeze_modules": "",
93
+ "warmup_ratio": 0.1,
94
+ "weight_decay": 0.0,
95
+ "logging_frequency": 10,
96
+ "gradient_clipping": 5.0,
97
+ "gradient_accumulation_steps": 1,
98
+ "optimizer": {
99
+ "name": "AdamW",
100
+ "betas": [
101
+ 0.9,
102
+ 0.95
103
+ ],
104
+ "eps": 1e-08,
105
+ "weight_decay": 1e-08
106
+ },
107
+ "is_resume": false,
108
+ "resume_epoch": null,
109
+ "resume_step": null,
110
+ "enable_gradient_checkpointing": true,
111
+ "enable_mixed_precision_training": true
112
+ },
113
+ "output_dir": "./runs/0424_QwenPI_13tasks_actionstate_50k"
114
+ }
0424_QwenPI_13tasks_actionstate_50k/config.yaml ADDED
@@ -0,0 +1,97 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_id: 0424_QwenPI_13tasks_actionstate_50k
2
+ run_root_dir: ./runs
3
+ seed: 42
4
+ trackers:
5
+ - jsonl
6
+ - wandb
7
+ wandb_entity: timsty
8
+ wandb_project: vla_jepa
9
+ is_debug: false
10
+ framework:
11
+ name: QwenPI
12
+ qwenvl:
13
+ base_vlm: /mnt/data/fangyu/model/Qwen/Qwen3-VL-2B-Instruct
14
+ attn_implementation: flash_attention_2
15
+ vl_hidden_dim: 2048
16
+ num_data_tokens: 32
17
+ action_model:
18
+ dataset_vocab_size: 256
19
+ hidden_size: 1024
20
+ add_pos_embed: true
21
+ max_seq_len: 1024
22
+ action_dim: 37
23
+ state_dim: 74
24
+ future_action_window_size: 14
25
+ action_horizon: 15
26
+ past_action_window_size: 0
27
+ noise_beta_alpha: 1.5
28
+ noise_beta_beta: 1.0
29
+ noise_s: 0.999
30
+ num_timestep_buckets: 1000
31
+ num_inference_timesteps: 10
32
+ num_target_vision_tokens: 32
33
+ diffusion_model_cfg:
34
+ dropout: 0.2
35
+ final_dropout: true
36
+ interleave_self_attention: true
37
+ norm_type: ada_norm
38
+ output_dim: 1024
39
+ positional_embeddings: null
40
+ datasets:
41
+ vla_data:
42
+ dataset_py: lerobot_datasets
43
+ data_root_dir: /mnt/data/fangyu/dataset/IPEC-COMMUNITY
44
+ data_mix: cross_embodiedment_13tasks
45
+ CoT_prompt: 'Task: {instruction}. What are the next 15 actions to take?'
46
+ default_image_resolution:
47
+ - 3
48
+ - 224
49
+ - 224
50
+ per_device_batch_size: 64
51
+ load_all_data_for_training: true
52
+ obs:
53
+ - image_0
54
+ image_size:
55
+ - 224
56
+ - 224
57
+ video_backend: torchcodec
58
+ load_video: true
59
+ chunk_size: 15
60
+ state_use_action_chunk: false
61
+ num_history_steps: 0
62
+ include_state: true
63
+ trainer:
64
+ epochs: 100
65
+ max_train_steps: 50000
66
+ num_warmup_steps: 5000
67
+ num_stable_steps: 0
68
+ save_interval: 5000
69
+ eval_interval: 50
70
+ max_checkpoints_to_keep: 20
71
+ repeated_diffusion_steps: 1
72
+ learning_rate:
73
+ base: 5.0e-05
74
+ qwen_vl_interface: 5.0e-05
75
+ action_model: 5.0e-05
76
+ lr_scheduler_type: warmup_stable_cosine
77
+ scheduler_specific_kwargs:
78
+ min_lr_ratio: 0.001
79
+ freeze_modules: ''
80
+ warmup_ratio: 0.1
81
+ weight_decay: 0.0
82
+ logging_frequency: 10
83
+ gradient_clipping: 5.0
84
+ gradient_accumulation_steps: 1
85
+ optimizer:
86
+ name: AdamW
87
+ betas:
88
+ - 0.9
89
+ - 0.95
90
+ eps: 1.0e-08
91
+ weight_decay: 1.0e-08
92
+ is_resume: false
93
+ resume_epoch: null
94
+ resume_step: null
95
+ enable_gradient_checkpointing: true
96
+ enable_mixed_precision_training: true
97
+ output_dir: ./runs/0424_QwenPI_13tasks_actionstate_50k
0424_QwenPI_13tasks_actionstate_50k/dataset_statistics.json ADDED
@@ -0,0 +1,682 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "franka": {
3
+ "action": {
4
+ "mean": [
5
+ 0.028950385935604575,
6
+ 0.03594802748411894,
7
+ -0.040578972548246384,
8
+ -0.00018153275595977897,
9
+ 0.002509436290711164,
10
+ -0.0015515198931097987,
11
+ 0.2097945421934128
12
+ ],
13
+ "std": [
14
+ 0.22410766487652278,
15
+ 0.24305199620930756,
16
+ 0.2951965321738853,
17
+ 0.02554494745114589,
18
+ 0.04195688852172731,
19
+ 0.04913475126163131,
20
+ 0.40719537354982976
21
+ ],
22
+ "max": [
23
+ 0.9375,
24
+ 0.9375,
25
+ 0.9375,
26
+ 0.3557142913341522,
27
+ 0.375,
28
+ 0.375,
29
+ 1.0
30
+ ],
31
+ "min": [
32
+ -0.9375,
33
+ -0.9375,
34
+ -0.9375,
35
+ -0.2582142949104309,
36
+ -0.375,
37
+ -0.3675000071525574,
38
+ 0.0
39
+ ],
40
+ "q01": [
41
+ -0.8785714507102966,
42
+ -0.8758928775787354,
43
+ -0.9375,
44
+ -0.1510714292526245,
45
+ -0.20678570866584778,
46
+ -0.2742857038974762,
47
+ 0.0
48
+ ],
49
+ "q99": [
50
+ 0.9375,
51
+ 0.9107142686843872,
52
+ 0.9375,
53
+ 0.20357142388820648,
54
+ 0.26357144117355347,
55
+ 0.375,
56
+ 1.0
57
+ ],
58
+ "mask": [
59
+ true,
60
+ true,
61
+ true,
62
+ true,
63
+ true,
64
+ true,
65
+ false
66
+ ]
67
+ },
68
+ "state": {
69
+ "mean": [
70
+ -0.019559418968856337,
71
+ 0.01475747274234891,
72
+ 0.3156160995364189,
73
+ 1.1908778190612794,
74
+ -0.05669147819280625,
75
+ -0.047077450156211856,
76
+ 0.010574408061802388,
77
+ -0.010662052407860756
78
+ ],
79
+ "std": [
80
+ 0.07142409265581258,
81
+ 0.097293833441406,
82
+ 0.45653463024572627,
83
+ 1.4755118780976493,
84
+ 0.5249547346172574,
85
+ 0.21261447615523038,
86
+ 0.01589982024424912,
87
+ 0.015944802785650813
88
+ ],
89
+ "max": [
90
+ 0.21031762659549713,
91
+ 0.39128610491752625,
92
+ 1.3660105466842651,
93
+ 3.6714255809783936,
94
+ 3.560650587081909,
95
+ 1.386339545249939,
96
+ 0.04233968257904053,
97
+ 0.0013633022317662835
98
+ ],
99
+ "min": [
100
+ -0.4828203022480011,
101
+ -0.3255046010017395,
102
+ 0.008128180168569088,
103
+ 0.35277295112609863,
104
+ -3.641430377960205,
105
+ -1.842738389968872,
106
+ -0.0013586411951109767,
107
+ -0.042040832340717316
108
+ ],
109
+ "q01": [
110
+ -0.42401049643754957,
111
+ -0.2838300323486328,
112
+ 0.009925739830359817,
113
+ 1.3085840785503386,
114
+ -2.886677579879761,
115
+ -1.1599004411697387,
116
+ 0.001503719249740243,
117
+ -0.040336399003863335
118
+ ],
119
+ "q99": [
120
+ 0.1530261474847791,
121
+ 0.3629165390133857,
122
+ 1.2910678112506866,
123
+ 3.303542451858519,
124
+ 2.7496529006957933,
125
+ 0.6893712210655194,
126
+ 0.040610933862626555,
127
+ -0.0015016929572448147
128
+ ]
129
+ },
130
+ "num_transitions": 273465,
131
+ "num_trajectories": 1693
132
+ },
133
+ "gr1": {
134
+ "action": {
135
+ "mean": [
136
+ -0.06503768935799599,
137
+ 0.1402852401137352,
138
+ -0.027576334401965143,
139
+ -0.7251276493072509,
140
+ 0.07538121624384077,
141
+ 0.0311446987092495,
142
+ -0.0006102971732616395,
143
+ -0.1556453585624695,
144
+ -0.17398847192525863,
145
+ 0.09801423102617265,
146
+ -0.7746159434318542,
147
+ 0.21945589482784272,
148
+ 0.05856966972351074,
149
+ 0.14407617151737215,
150
+ -0.04729328155517579,
151
+ -0.04729328155517579,
152
+ -0.04729328155517579,
153
+ -0.04729328155517579,
154
+ -0.09458656311035157,
155
+ 0.30000000000000004,
156
+ -0.16327507942914965,
157
+ -0.16327507942914965,
158
+ -0.16327507942914965,
159
+ -0.16327507942914965,
160
+ -0.3265501588582993,
161
+ 1.5000000000000002,
162
+ 0.004927502572536469,
163
+ 0.0010833685897523536,
164
+ -0.00044836528250016274
165
+ ],
166
+ "std": [
167
+ 0.20562330785235147,
168
+ 0.18647844645723213,
169
+ 0.13514553802530443,
170
+ 0.765678360428597,
171
+ 0.20251337668667177,
172
+ 0.16959756731031508,
173
+ 0.19710131907015732,
174
+ 0.4583574896238878,
175
+ 0.27460068635203594,
176
+ 0.3014025883171815,
177
+ 0.9046809346526231,
178
+ 0.4397149950522067,
179
+ 0.29622449978942395,
180
+ 0.45108890314809014,
181
+ 0.47196951455091185,
182
+ 0.47196951455091185,
183
+ 0.47196951455091185,
184
+ 0.47196951455091185,
185
+ 0.9439390291018237,
186
+ 0.9,
187
+ 1.0480660811801392,
188
+ 1.0480660811801392,
189
+ 1.0480660811801392,
190
+ 1.0480660811801392,
191
+ 2.0961321623602784,
192
+ 1.4999999999999998,
193
+ 0.036936757396854626,
194
+ 0.012072528210758757,
195
+ 0.007232476061257436
196
+ ],
197
+ "max": [
198
+ 1.2965171337127686,
199
+ 1.069582223892212,
200
+ 0.6721073985099792,
201
+ -0.00036245581577531993,
202
+ 1.404510259628296,
203
+ 1.4991986751556396,
204
+ 1.320265293121338,
205
+ 1.4943703413009644,
206
+ 0.00015122668992262334,
207
+ 1.5548107624053955,
208
+ 5.365318065742031e-05,
209
+ 2.501049041748047,
210
+ 1.4930087327957153,
211
+ 1.4891765117645264,
212
+ 1.5,
213
+ 1.5,
214
+ 1.5,
215
+ 1.5,
216
+ 3.0,
217
+ 3.0,
218
+ 1.5,
219
+ 1.5,
220
+ 1.5,
221
+ 1.5,
222
+ 3.0,
223
+ 3.0,
224
+ 0.3233739137649536,
225
+ 0.16282705962657928,
226
+ 0.4328489303588867
227
+ ],
228
+ "min": [
229
+ -1.2668161392211914,
230
+ -0.00042632038821466267,
231
+ -1.3582642078399658,
232
+ -2.776721477508545,
233
+ -1.6229861974716187,
234
+ -1.31162691116333,
235
+ -1.1806696653366089,
236
+ -2.101841926574707,
237
+ -1.509853482246399,
238
+ -1.2852329015731812,
239
+ -2.78891658782959,
240
+ -0.9951868653297424,
241
+ -1.49818754196167,
242
+ -1.4881112575531006,
243
+ -1.5,
244
+ -1.5,
245
+ -1.5,
246
+ -1.5,
247
+ -3.0,
248
+ 0.0,
249
+ -1.5,
250
+ -1.5,
251
+ -1.5,
252
+ -1.5,
253
+ -3.0,
254
+ 3.0,
255
+ -0.29814863204956055,
256
+ -0.3523012101650238,
257
+ -0.09862830489873886
258
+ ],
259
+ "q01": [
260
+ -1.1944766759872436,
261
+ -4.301190131172918e-07,
262
+ -0.7498355388641358,
263
+ -2.5581901550292967,
264
+ -0.6824928283691406,
265
+ -0.8841829299926758,
266
+ -1.0078708410263062,
267
+ -1.6597670578956605,
268
+ -1.226578596830368,
269
+ -0.9258902847766877,
270
+ -2.6987613677978515,
271
+ -0.8498974800109863,
272
+ -1.0853091955184937,
273
+ -1.0854953002929688,
274
+ -1.5,
275
+ -1.5,
276
+ -1.5,
277
+ -1.5,
278
+ -3.0,
279
+ 0.0,
280
+ -1.5,
281
+ -1.5,
282
+ -1.5,
283
+ -1.5,
284
+ -3.0,
285
+ 3.0,
286
+ -0.1551497459411621,
287
+ -0.04802883893251419,
288
+ -0.029186927154660224
289
+ ],
290
+ "q99": [
291
+ 1.0110889196395876,
292
+ 0.9781616687774661,
293
+ 0.46411060094833406,
294
+ -0.07979833036661146,
295
+ 1.0625922203063969,
296
+ 0.9605619907379178,
297
+ 0.6082226157188424,
298
+ 1.1673259019851685,
299
+ -2.7766001403513115e-06,
300
+ 1.0872023344039914,
301
+ -0.05551127571612597,
302
+ 1.9727541685104366,
303
+ 1.0421148896217345,
304
+ 1.4869407570362092,
305
+ 1.5,
306
+ 1.5,
307
+ 1.5,
308
+ 1.5,
309
+ 3.0,
310
+ 3.0,
311
+ 1.5,
312
+ 1.5,
313
+ 1.5,
314
+ 1.5,
315
+ 3.0,
316
+ 3.0,
317
+ 0.2753815710544586,
318
+ 0.06614580899477027,
319
+ 0.013670806447044017
320
+ ],
321
+ "mask": [
322
+ true,
323
+ true,
324
+ true,
325
+ true,
326
+ true,
327
+ true,
328
+ true,
329
+ true,
330
+ true,
331
+ true,
332
+ true,
333
+ true,
334
+ true,
335
+ true,
336
+ true,
337
+ true,
338
+ true,
339
+ true,
340
+ true,
341
+ true,
342
+ true,
343
+ true,
344
+ true,
345
+ true,
346
+ true,
347
+ true,
348
+ true,
349
+ true,
350
+ true
351
+ ]
352
+ },
353
+ "state": {
354
+ "mean": [
355
+ -0.06540636196732522,
356
+ 0.14223336279392243,
357
+ -0.02882793508470059,
358
+ -0.7281232118606568,
359
+ 0.07631409014575184,
360
+ 0.03485768660902977,
361
+ -0.0018693804740905805,
362
+ -0.15062302350997925,
363
+ -0.17422722429037094,
364
+ 0.10088010430335999,
365
+ -0.7751174092292785,
366
+ 0.21422418504953386,
367
+ 0.056977791339159006,
368
+ 0.1301754331216216,
369
+ 0.0444428395247087,
370
+ 0.046001738880295316,
371
+ 0.04305497270543129,
372
+ 0.04596460912143812,
373
+ 0.010766410198993982,
374
+ 0.174838250502944,
375
+ 0.2807944118976593,
376
+ 0.2625684827566147,
377
+ 0.24885019063949584,
378
+ 0.2602905809879303,
379
+ 0.0419048547744751,
380
+ 0.8312440872192383,
381
+ 0.004883934883400798,
382
+ 8.523006690666076e-05,
383
+ -6.207618571352216e-05
384
+ ],
385
+ "std": [
386
+ 0.20013891174318804,
387
+ 0.18784022709302264,
388
+ 0.13399923214695403,
389
+ 0.7673781334859416,
390
+ 0.1990098070412684,
391
+ 0.16736959256657702,
392
+ 0.19155714110140948,
393
+ 0.4472930058630781,
394
+ 0.26891556144795553,
395
+ 0.28930308542693634,
396
+ 0.8909602741089023,
397
+ 0.43545203501049284,
398
+ 0.2820895843302683,
399
+ 0.41341088988690194,
400
+ 0.24419357713232692,
401
+ 0.22780756672400648,
402
+ 0.21366731203921618,
403
+ 0.2305132558900519,
404
+ 0.06863410938203367,
405
+ 0.5112184050495793,
406
+ 0.5159579892170897,
407
+ 0.47904712336208155,
408
+ 0.45710343758297267,
409
+ 0.47342494976461513,
410
+ 0.13166977346516295,
411
+ 0.8450399122937896,
412
+ 0.034949910387869945,
413
+ 0.011174551728270072,
414
+ 0.00744905569932275
415
+ ],
416
+ "max": [
417
+ 1.254090428352356,
418
+ 1.0467604398727417,
419
+ 0.6428823471069336,
420
+ 0.0017068678280338645,
421
+ 1.3265025615692139,
422
+ 1.4839727878570557,
423
+ 1.1649909019470215,
424
+ 1.4408859014511108,
425
+ 0.0030245338566601276,
426
+ 1.529702067375183,
427
+ 0.0012778707314282656,
428
+ 2.4572627544403076,
429
+ 1.3810820579528809,
430
+ 1.3259196281433105,
431
+ 1.7941447496414185,
432
+ 1.7346926927566528,
433
+ 2.032738208770752,
434
+ 1.8508540391921997,
435
+ 1.3105334043502808,
436
+ 2.0280985832214355,
437
+ 2.1240122318267822,
438
+ 1.7788946628570557,
439
+ 2.984133005142212,
440
+ 2.44663405418396,
441
+ 1.2877141237258911,
442
+ 2.037182092666626,
443
+ 0.30236849188804626,
444
+ 0.1535278707742691,
445
+ 0.38705629110336304
446
+ ],
447
+ "min": [
448
+ -1.2302747964859009,
449
+ -0.008526407182216644,
450
+ -1.3281980752944946,
451
+ -2.5072484016418457,
452
+ -1.5798313617706299,
453
+ -1.1906307935714722,
454
+ -1.0882562398910522,
455
+ -2.059584379196167,
456
+ -1.475722312927246,
457
+ -1.2510409355163574,
458
+ -2.5155985355377197,
459
+ -0.9702507257461548,
460
+ -1.463935375213623,
461
+ -1.2635116577148438,
462
+ -1.1052463054656982,
463
+ -0.8339442014694214,
464
+ -1.2814871072769165,
465
+ -1.6386417150497437,
466
+ -0.816240131855011,
467
+ -0.5184589624404907,
468
+ -1.224429726600647,
469
+ -0.9850000739097595,
470
+ -0.9763456583023071,
471
+ -0.500698447227478,
472
+ -0.7500660419464111,
473
+ -0.03356735035777092,
474
+ -0.26449069380760193,
475
+ -0.3266247510910034,
476
+ -0.09658436477184296
477
+ ],
478
+ "q01": [
479
+ -1.1889611959457398,
480
+ -0.0009903528727591038,
481
+ -0.7342327952384948,
482
+ -2.4300240993499758,
483
+ -0.6584946513175964,
484
+ -0.8250447034835815,
485
+ -0.9737806677818298,
486
+ -1.6477210569381713,
487
+ -1.2134740138053894,
488
+ -0.8785631865262985,
489
+ -2.505193281173706,
490
+ -0.8399241447448731,
491
+ -1.0055391049385072,
492
+ -0.9640253639221191,
493
+ -0.47676344215869904,
494
+ -0.08676981404423714,
495
+ -0.14494537323713302,
496
+ -0.059164867363870145,
497
+ -0.1558390498161316,
498
+ -0.02249552313238381,
499
+ -0.0051496786996722225,
500
+ -0.005549988709390163,
501
+ -0.006174665316939354,
502
+ -0.005817336589097976,
503
+ -0.5121413707733155,
504
+ 0.3231884375214577,
505
+ -0.1299474745988846,
506
+ -0.045216087996959684,
507
+ -0.030235426500439644
508
+ ],
509
+ "q99": [
510
+ 0.9937156438827516,
511
+ 0.9744037270545968,
512
+ 0.4551989555358894,
513
+ -0.09210347831249224,
514
+ 1.0528851509094246,
515
+ 0.9591211795806898,
516
+ 0.5920819044113171,
517
+ 1.1361155986785891,
518
+ 0.0001814767369069183,
519
+ 1.052486894130706,
520
+ -0.049791696146131215,
521
+ 1.9595401525497436,
522
+ 0.9932814061641682,
523
+ 1.241852431297302,
524
+ 1.502415704727173,
525
+ 1.5030960321426392,
526
+ 1.4880860090255776,
527
+ 1.5015064239501954,
528
+ 0.6326038002967835,
529
+ 1.884292006492615,
530
+ 1.5134866952896122,
531
+ 1.5681370496749878,
532
+ 2.706826210021973,
533
+ 1.7132962703704837,
534
+ 0.8768314361572273,
535
+ 1.832364867925644,
536
+ 0.2745771288871766,
537
+ 0.06204778626561166,
538
+ 0.04224991366267195
539
+ ]
540
+ },
541
+ "num_transitions": 248956,
542
+ "num_trajectories": 1000
543
+ },
544
+ "real_world_franka": {
545
+ "action": {
546
+ "mean": [
547
+ 0.0018022622913122178,
548
+ 0.00866750255227089,
549
+ -0.0023813677951693537,
550
+ 0.006971974670886994,
551
+ -0.00047582909464836124,
552
+ 0.0025789525359869005,
553
+ -0.0007287326734513044,
554
+ 0.035997286438941956
555
+ ],
556
+ "std": [
557
+ 0.024339838465266404,
558
+ 0.06490750395949492,
559
+ 0.021401284949155275,
560
+ 0.05111120007770312,
561
+ 0.037778529131822655,
562
+ 0.05658410498726164,
563
+ 0.06271033042800869,
564
+ 0.17357673463760007
565
+ ],
566
+ "max": [
567
+ 0.21409234404563904,
568
+ 0.6854990124702454,
569
+ 0.30057650804519653,
570
+ 0.7143238186836243,
571
+ 0.6867426037788391,
572
+ 0.5510483980178833,
573
+ 0.5336411595344543,
574
+ 1.0
575
+ ],
576
+ "min": [
577
+ -0.2338617593050003,
578
+ -0.558387279510498,
579
+ -0.2482951432466507,
580
+ -0.6626467704772949,
581
+ -0.47793203592300415,
582
+ -0.584820032119751,
583
+ -0.7077043652534485,
584
+ 0.0
585
+ ],
586
+ "q01": [
587
+ -0.1346631145477295,
588
+ -0.3504452162981033,
589
+ -0.15663981318473816,
590
+ -0.24537096738815306,
591
+ -0.22821950614452363,
592
+ -0.42980227649211883,
593
+ -0.4895046579837799,
594
+ 0.0
595
+ ],
596
+ "q99": [
597
+ 0.1725029143691063,
598
+ 0.4685746806859974,
599
+ 0.10869869187474263,
600
+ 0.499900839328766,
601
+ 0.28230221629142765,
602
+ 0.3843919765949251,
603
+ 0.38130330502986914,
604
+ 1.0
605
+ ],
606
+ "mask": [
607
+ true,
608
+ true,
609
+ true,
610
+ true,
611
+ true,
612
+ true,
613
+ true,
614
+ false
615
+ ]
616
+ },
617
+ "state": {
618
+ "mean": [
619
+ 0.00031761352438479666,
620
+ 0.0020736783742904665,
621
+ 0.0034826237708330157,
622
+ -0.234240460395813,
623
+ -0.0018191402778029442,
624
+ 0.2424022436141968,
625
+ -0.001537260226905346,
626
+ 0.030011588335037233
627
+ ],
628
+ "std": [
629
+ 0.024077303105278742,
630
+ 0.08790303996624453,
631
+ 0.027178490734489504,
632
+ 0.7067546375834215,
633
+ 0.027173463008725068,
634
+ 0.7303538119052045,
635
+ 0.06428378288303241,
636
+ 0.1521238095109371
637
+ ],
638
+ "max": [
639
+ 0.2896324098110199,
640
+ 0.5507338047027588,
641
+ 0.31784605979919434,
642
+ -1.5832326412200928,
643
+ 0.3542541265487671,
644
+ 3.033360481262207,
645
+ 0.6994425058364868,
646
+ 1.0
647
+ ],
648
+ "min": [
649
+ -0.22138147056102753,
650
+ -0.8714362382888794,
651
+ -0.3488052189350128,
652
+ -2.7835195064544678,
653
+ -0.34267839789390564,
654
+ 1.3950575590133667,
655
+ -0.6863359808921814,
656
+ 0.0
657
+ ],
658
+ "q01": [
659
+ -0.18218472093343735,
660
+ -0.6171795415878296,
661
+ -0.13265437811613082,
662
+ -2.723349404335022,
663
+ -0.25293527901172635,
664
+ 1.8917096638679505,
665
+ -0.41360526919364926,
666
+ 0.0
667
+ ],
668
+ "q99": [
669
+ 0.23308583796024324,
670
+ 0.4467512100934983,
671
+ 0.26850769817829134,
672
+ -1.8047044682502746,
673
+ 0.1607170441746712,
674
+ 2.883582048416138,
675
+ 0.5439058530330658,
676
+ 1.0
677
+ ]
678
+ },
679
+ "num_transitions": 38179,
680
+ "num_trajectories": 202
681
+ }
682
+ }
0424_QwenPI_13tasks_actionstate_50k/final_model/pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b80626e3aaa399ee29f0845ded18039044f63838b249dd5bf7a0c863f7f6424
3
+ size 8269619462
0424_QwenPI_13tasks_actionstate_50k/run_qwenpi_vla.sh ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #export NCCL_SOCKET_IFNAME=bond0
2
+ #export NCCL_IB_HCA=mlx5_2,mlx5_3
3
+ export NCCL_BLOCKING_WAIT=1
4
+ export NCCL_ASYNC_ERROR_HANDLING=1
5
+ export NCCL_TIMEOUT=1000 # timeout set to 1 hour (unit: seconds)
6
+ export CUDA_VISIBLE_DEVICES=0,1,2,3
7
+
8
+ # === Please modify the following paths according to your environment ===
9
+ ###########################################################################################
10
+ run_root_dir=./runs
11
+ run_id=0424_QwenPI_13tasks_actionstate_50k
12
+ ###########################################################################################
13
+
14
+ output_dir=${run_root_dir}/${run_id}
15
+ mkdir -p ${output_dir}
16
+ cp $0 ${output_dir}/
17
+
18
+ accelerate launch \
19
+ --config_file ./starVLA/config/deepseeds/deepspeed_zero2.yaml \
20
+ --num_processes 4 \
21
+ --main_process_port 29800 \
22
+ starVLA/training/train_qwenpi.py \
23
+ --config_yaml ./starVLA/config/training/starvla_train_qwenpi.yaml \
24
+ --run_root_dir ${run_root_dir} \
25
+ --run_id ${run_id} \
26
+ --wandb_project vla_jepa \
27
+ --wandb_entity timsty
0424_QwenPI_13tasks_actionstate_50k/summary.jsonl ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {"steps": 5000}
2
+ {"steps": 10000}
3
+ {"steps": 15000}
4
+ {"steps": 20000}
5
+ {"steps": 25000}
6
+ {"steps": 30000}
7
+ {"steps": 35000}
8
+ {"steps": 40000}
9
+ {"steps": 45000}
10
+ {"steps": 50000}