nextbig commited on
Commit
c8eeae0
·
verified ·
1 Parent(s): 031b206

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_dim": 32,
3
+ "action_head_cfg": {
4
+ "action_dim": 32,
5
+ "action_horizon": 16,
6
+ "add_pos_embed": true,
7
+ "backbone_embedding_dim": 2048,
8
+ "diffusion_model_cfg": {
9
+ "attention_head_dim": 48,
10
+ "cross_attention_dim": 2048,
11
+ "dropout": 0.2,
12
+ "final_dropout": true,
13
+ "interleave_self_attention": true,
14
+ "norm_type": "ada_norm",
15
+ "num_attention_heads": 32,
16
+ "num_layers": 16,
17
+ "output_dim": 1024,
18
+ "positional_embeddings": null
19
+ },
20
+ "hidden_size": 1024,
21
+ "input_embedding_dim": 1536,
22
+ "max_action_dim": 32,
23
+ "max_state_dim": 64,
24
+ "model_dtype": "float32",
25
+ "noise_beta_alpha": 1.5,
26
+ "noise_beta_beta": 1.0,
27
+ "noise_s": 0.999,
28
+ "num_inference_timesteps": 4,
29
+ "num_target_vision_tokens": 32,
30
+ "num_timestep_buckets": 1000,
31
+ "tune_diffusion_model": true,
32
+ "tune_projector": true,
33
+ "use_vlln": true,
34
+ "vl_self_attention_cfg": {
35
+ "attention_head_dim": 64,
36
+ "dropout": 0.2,
37
+ "final_dropout": true,
38
+ "num_attention_heads": 32,
39
+ "num_layers": 4,
40
+ "positional_embeddings": null
41
+ }
42
+ },
43
+ "action_horizon": 16,
44
+ "architectures": [
45
+ "GR00T_N1_5"
46
+ ],
47
+ "attn_implementation": null,
48
+ "backbone_cfg": {
49
+ "eagle_path": "NVEagle/eagle_er-qwen3_1_7B-Siglip2_400M_stage1_5_128gpu_er_v7_1mlp_nops",
50
+ "load_bf16": false,
51
+ "project_to_dim": null,
52
+ "reproject_vision": false,
53
+ "select_layer": 12,
54
+ "tune_llm": false,
55
+ "tune_visual": true,
56
+ "use_flash_attention": true
57
+ },
58
+ "compute_dtype": "bfloat16",
59
+ "hidden_size": 2048,
60
+ "model_dtype": "float32",
61
+ "model_type": "gr00t_n1_5",
62
+ "torch_dtype": "bfloat16",
63
+ "transformers_version": "4.52.1"
64
+ }
experiment_cfg/metadata.json ADDED
@@ -0,0 +1,387 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "statistics": {
4
+ "state": {
5
+ "left_arm": {
6
+ "max": [
7
+ 0.23685863614082336,
8
+ 2.63502836227417,
9
+ 0.03330088034272194,
10
+ 1.4575419425964355,
11
+ 0.8281587362289429,
12
+ 1.9787147045135498
13
+ ],
14
+ "min": [
15
+ -0.797720193862915,
16
+ -0.012758356519043446,
17
+ -2.2290821075439453,
18
+ -1.7361313104629517,
19
+ -0.532290518283844,
20
+ -1.4025291204452515
21
+ ],
22
+ "mean": [
23
+ -0.09467598050832748,
24
+ 0.29610729217529297,
25
+ -0.1754428744316101,
26
+ -0.0011706651421263814,
27
+ 0.08008287101984024,
28
+ 0.004690642934292555
29
+ ],
30
+ "std": [
31
+ 0.11690603941679001,
32
+ 0.6777294278144836,
33
+ 0.4925391376018524,
34
+ 0.22012004256248474,
35
+ 0.08415775001049042,
36
+ 0.2379513680934906
37
+ ],
38
+ "q01": [
39
+ -0.6201645332574844,
40
+ -0.012758356519043446,
41
+ -1.8302751040458678,
42
+ -0.8233977997303008,
43
+ -0.25266467064619064,
44
+ -0.6677455306053162
45
+ ],
46
+ "q99": [
47
+ 0.0558854416012764,
48
+ 2.305639197826385,
49
+ 0.03330088034272194,
50
+ 0.8909350645542136,
51
+ 0.378433117866516,
52
+ 0.9695222181081766
53
+ ]
54
+ },
55
+ "left_gripper": {
56
+ "max": [
57
+ 0.054858461022377014
58
+ ],
59
+ "min": [
60
+ -0.0037799999117851257
61
+ ],
62
+ "mean": [
63
+ 0.0005394071922637522
64
+ ],
65
+ "std": [
66
+ 0.008630749769508839
67
+ ],
68
+ "q01": [
69
+ -0.0037799999117851257
70
+ ],
71
+ "q99": [
72
+ 0.04758923128247261
73
+ ]
74
+ },
75
+ "right_arm": {
76
+ "max": [
77
+ 0.8744099736213684,
78
+ 2.716465473175049,
79
+ 0.010594148188829422,
80
+ 1.7382432222366333,
81
+ 1.2609829902648926,
82
+ 0.7371398210525513
83
+ ],
84
+ "min": [
85
+ -0.30108675360679626,
86
+ 0.0,
87
+ -2.7580041885375977,
88
+ -1.2717341184616089,
89
+ -0.7101046442985535,
90
+ -2.1718528270721436
91
+ ],
92
+ "mean": [
93
+ 0.13320903480052948,
94
+ 1.0849677324295044,
95
+ -0.8214209079742432,
96
+ 0.08245757967233658,
97
+ 0.34770581126213074,
98
+ -0.34033045172691345
99
+ ],
100
+ "std": [
101
+ 0.23607806861400604,
102
+ 0.958350658416748,
103
+ 0.8432449102401733,
104
+ 0.26838839054107666,
105
+ 0.4480270445346832,
106
+ 0.4256483316421509
107
+ ],
108
+ "q01": [
109
+ -0.1667721477150917,
110
+ 0.0,
111
+ -2.3997578620910645,
112
+ -0.7350239264965057,
113
+ -0.21033382192254066,
114
+ -1.8293345880508423
115
+ ],
116
+ "q99": [
117
+ 0.734721313714981,
118
+ 2.5196237874031064,
119
+ 0.009965830482542515,
120
+ 1.0604445934295654,
121
+ 1.2147316932678223,
122
+ 0.37224382162094116
123
+ ]
124
+ },
125
+ "right_gripper": {
126
+ "max": [
127
+ 0.08273077011108398
128
+ ],
129
+ "min": [
130
+ -0.0005769230774603784
131
+ ],
132
+ "mean": [
133
+ 0.017459724098443985
134
+ ],
135
+ "std": [
136
+ 0.02439081110060215
137
+ ],
138
+ "q01": [
139
+ -0.0004615384677890688
140
+ ],
141
+ "q99": [
142
+ 0.07165384292602539
143
+ ]
144
+ }
145
+ },
146
+ "action": {
147
+ "left_arm": {
148
+ "max": [
149
+ 0.23685863614082336,
150
+ 2.63502836227417,
151
+ 0.03330088034272194,
152
+ 1.4575419425964355,
153
+ 0.8281587362289429,
154
+ 1.9787147045135498
155
+ ],
156
+ "min": [
157
+ -0.797720193862915,
158
+ -0.012758356519043446,
159
+ -2.2290821075439453,
160
+ -1.7361313104629517,
161
+ -0.532290518283844,
162
+ -1.4025291204452515
163
+ ],
164
+ "mean": [
165
+ -0.09467556327581406,
166
+ 0.2961057424545288,
167
+ -0.1754431128501892,
168
+ -0.0011543770087882876,
169
+ 0.08008351922035217,
170
+ 0.0046795387752354145
171
+ ],
172
+ "std": [
173
+ 0.11690639704465866,
174
+ 0.6777272820472717,
175
+ 0.4925388991832733,
176
+ 0.2201227992773056,
177
+ 0.08415870368480682,
178
+ 0.23795734345912933
179
+ ],
180
+ "q01": [
181
+ -0.6201645332574844,
182
+ -0.012758356519043446,
183
+ -1.8302751040458678,
184
+ -0.8233977997303008,
185
+ -0.25266467064619064,
186
+ -0.6677455306053162
187
+ ],
188
+ "q99": [
189
+ 0.0558854416012764,
190
+ 2.305639197826385,
191
+ 0.03330088034272194,
192
+ 0.8909350645542136,
193
+ 0.378433117866516,
194
+ 0.9695222181081766
195
+ ]
196
+ },
197
+ "left_gripper": {
198
+ "max": [
199
+ 0.054858461022377014
200
+ ],
201
+ "min": [
202
+ -0.0037799999117851257
203
+ ],
204
+ "mean": [
205
+ 0.0005394072504714131
206
+ ],
207
+ "std": [
208
+ 0.008630749769508839
209
+ ],
210
+ "q01": [
211
+ -0.0037799999117851257
212
+ ],
213
+ "q99": [
214
+ 0.04758923128247261
215
+ ]
216
+ },
217
+ "right_arm": {
218
+ "max": [
219
+ 0.8744099736213684,
220
+ 2.716465473175049,
221
+ 0.010594148188829422,
222
+ 1.7382432222366333,
223
+ 1.2609829902648926,
224
+ 0.7371398210525513
225
+ ],
226
+ "min": [
227
+ -0.30108675360679626,
228
+ 0.0,
229
+ -2.7580041885375977,
230
+ -1.2717341184616089,
231
+ -0.7101046442985535,
232
+ -2.1718528270721436
233
+ ],
234
+ "mean": [
235
+ 0.13320539891719818,
236
+ 1.084963083267212,
237
+ -0.8214203119277954,
238
+ 0.08245743811130524,
239
+ 0.3477059602737427,
240
+ -0.3403414785861969
241
+ ],
242
+ "std": [
243
+ 0.23608171939849854,
244
+ 0.958354115486145,
245
+ 0.8432462811470032,
246
+ 0.2683871388435364,
247
+ 0.44802600145339966,
248
+ 0.4256395101547241
249
+ ],
250
+ "q01": [
251
+ -0.16684684187173843,
252
+ 0.0,
253
+ -2.3997578620910645,
254
+ -0.7350239264965057,
255
+ -0.21033382192254066,
256
+ -1.8293345880508423
257
+ ],
258
+ "q99": [
259
+ 0.734721313714981,
260
+ 2.5196237874031064,
261
+ 0.009965830482542515,
262
+ 1.0604445934295654,
263
+ 1.2147316932678223,
264
+ 0.37224382162094116
265
+ ]
266
+ },
267
+ "right_gripper": {
268
+ "max": [
269
+ 0.08273077011108398
270
+ ],
271
+ "min": [
272
+ -0.0005769230774603784
273
+ ],
274
+ "mean": [
275
+ 0.01745966635644436
276
+ ],
277
+ "std": [
278
+ 0.024390874430537224
279
+ ],
280
+ "q01": [
281
+ -0.0004615384677890688
282
+ ],
283
+ "q99": [
284
+ 0.07165384292602539
285
+ ]
286
+ }
287
+ }
288
+ },
289
+ "modalities": {
290
+ "video": {
291
+ "cam_high": {
292
+ "resolution": [
293
+ 640,
294
+ 480
295
+ ],
296
+ "channels": 3,
297
+ "fps": 30.0
298
+ },
299
+ "cam_left_wrist": {
300
+ "resolution": [
301
+ 640,
302
+ 480
303
+ ],
304
+ "channels": 3,
305
+ "fps": 30.0
306
+ },
307
+ "cam_right_wrist": {
308
+ "resolution": [
309
+ 640,
310
+ 480
311
+ ],
312
+ "channels": 3,
313
+ "fps": 30.0
314
+ }
315
+ },
316
+ "state": {
317
+ "left_arm": {
318
+ "absolute": true,
319
+ "rotation_type": null,
320
+ "shape": [
321
+ 6
322
+ ],
323
+ "continuous": true
324
+ },
325
+ "left_gripper": {
326
+ "absolute": true,
327
+ "rotation_type": null,
328
+ "shape": [
329
+ 1
330
+ ],
331
+ "continuous": true
332
+ },
333
+ "right_arm": {
334
+ "absolute": true,
335
+ "rotation_type": null,
336
+ "shape": [
337
+ 6
338
+ ],
339
+ "continuous": true
340
+ },
341
+ "right_gripper": {
342
+ "absolute": true,
343
+ "rotation_type": null,
344
+ "shape": [
345
+ 1
346
+ ],
347
+ "continuous": true
348
+ }
349
+ },
350
+ "action": {
351
+ "left_arm": {
352
+ "absolute": true,
353
+ "rotation_type": null,
354
+ "shape": [
355
+ 6
356
+ ],
357
+ "continuous": true
358
+ },
359
+ "left_gripper": {
360
+ "absolute": true,
361
+ "rotation_type": null,
362
+ "shape": [
363
+ 1
364
+ ],
365
+ "continuous": true
366
+ },
367
+ "right_arm": {
368
+ "absolute": true,
369
+ "rotation_type": null,
370
+ "shape": [
371
+ 6
372
+ ],
373
+ "continuous": true
374
+ },
375
+ "right_gripper": {
376
+ "absolute": true,
377
+ "rotation_type": null,
378
+ "shape": [
379
+ 1
380
+ ],
381
+ "continuous": true
382
+ }
383
+ }
384
+ },
385
+ "embodiment_tag": "new_embodiment"
386
+ }
387
+ }
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa3f287d6c0393470bfd6945e9a815b4644b786e6b8dff364a8a890cbea093ca
3
+ size 4999367032
model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7874b00e0770a305f5f76e0127dec1c1dd441647c2bf981c792cc077553b469
3
+ size 2586705312
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71308f727e1b5bfab40404f81b9ddd4500ba137b42bdb6018a29783d6e1d8782
3
+ size 5713