chuanmew commited on
Commit
4e3c955
·
verified ·
1 Parent(s): a1565d4

test-2-checkpoint-70000

Browse files
test-2-checkpoint-70000/config.json ADDED
@@ -0,0 +1,130 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "batch_size": 64,
3
+ "buffer_size": 64,
4
+ "from_pretrained": "oxe-g2-checkpoint-300000",
5
+ "frozen_keys": [
6
+ "*hf_model*"
7
+ ],
8
+ "model": {
9
+ "heads": {
10
+ "action": {
11
+ "args": [],
12
+ "kwargs": {
13
+ "action_dim": 7,
14
+ "action_horizon": 4,
15
+ "readout_key": "readout_action",
16
+ "token_embedding_size": 768
17
+ },
18
+ "module": "model.octo.components.action_heads",
19
+ "name": "L1ActionHead"
20
+ }
21
+ },
22
+ "max_horizon": 10,
23
+ "observation_tokenizers": {
24
+ "primary": {
25
+ "args": [],
26
+ "kwargs": {
27
+ "encoder": {
28
+ "args": [],
29
+ "kwargs": {
30
+ "in_features": 6
31
+ },
32
+ "module": "octo.model.components.vit_encoders",
33
+ "name": "SmallStem16"
34
+ },
35
+ "obs_stack_keys": [
36
+ "image_primary"
37
+ ],
38
+ "task_stack_keys": [
39
+ "image_primary"
40
+ ]
41
+ },
42
+ "module": "octo.model.components.tokenizers",
43
+ "name": "ImageTokenizer"
44
+ }
45
+ },
46
+ "readouts": {
47
+ "action": 1
48
+ },
49
+ "repeat_task_tokens": true,
50
+ "task_tokenizers": {
51
+ "language": {
52
+ "args": [],
53
+ "kwargs": {
54
+ "encoder": "t5-base",
55
+ "finetune_encoder": false
56
+ },
57
+ "module": "octo.model.components.tokenizers",
58
+ "name": "LanguageTokenizer"
59
+ }
60
+ },
61
+ "token_embedding_size": 768,
62
+ "transformer_kwargs": {
63
+ "add_position_embedding": false,
64
+ "attention_dropout_rate": 0.0,
65
+ "dropout_rate": 0.0,
66
+ "mlp_dim": 3072,
67
+ "num_attention_heads": 12,
68
+ "num_layers": 12
69
+ },
70
+ "use_correct_attention": true
71
+ },
72
+ "normalize_method": "sign",
73
+ "obs_token_nums": {
74
+ "primary": 256
75
+ },
76
+ "sampler_num_samples": 2560000,
77
+ "seed": 2,
78
+ "subsample_length": 99999,
79
+ "text_processor": {
80
+ "args": [],
81
+ "kwargs": {
82
+ "encode_with_model": false,
83
+ "tokenizer_kwargs": {
84
+ "max_length": 16,
85
+ "padding": "max_length",
86
+ "return_tensors": "np",
87
+ "truncation": true
88
+ },
89
+ "tokenizer_name": "t5-base"
90
+ },
91
+ "module": "octo.components.text_processing",
92
+ "name": "HFTokenizer"
93
+ },
94
+ "training_arguments": {
95
+ "bf16": true,
96
+ "dataloader_pin_memory": true,
97
+ "ddp_find_unused_parameters": true,
98
+ "eval_steps": 5000,
99
+ "gradient_accumulation_steps": 4,
100
+ "learning_rate": 3e-05,
101
+ "logging_nan_inf_filter": false,
102
+ "logging_steps": 100,
103
+ "lr_scheduler_kwargs": {
104
+ "decay_type": "cosine",
105
+ "min_lr_ratio": 0.05,
106
+ "num_decay_steps": 298000
107
+ },
108
+ "lr_scheduler_type": "constant",
109
+ "max_grad_norm": 1.0,
110
+ "max_steps": 300000,
111
+ "optim": "adamw_torch_fused",
112
+ "per_device_eval_batch_size": 1,
113
+ "per_device_train_batch_size": 1,
114
+ "report_to": "wandb",
115
+ "save_safetensors": true,
116
+ "save_steps": 500,
117
+ "torch_compile": true,
118
+ "warmup_steps": 2000,
119
+ "weight_decay": 0.1
120
+ },
121
+ "training_keys": [
122
+ "*action*",
123
+ "*task_projections*",
124
+ "*obs_projections*",
125
+ "*readout_embeddings*",
126
+ "*task_pos_embeddings*",
127
+ "*obs_pos_embeddings*",
128
+ "*observation_tokenizers*"
129
+ ]
130
+ }
test-2-checkpoint-70000/dataset_statistics.json ADDED
@@ -0,0 +1,253 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "observation.images.main_camera": {
4
+ "min": [
5
+ [
6
+ [
7
+ 0.0
8
+ ]
9
+ ],
10
+ [
11
+ [
12
+ 0.0
13
+ ]
14
+ ],
15
+ [
16
+ [
17
+ 0.0
18
+ ]
19
+ ]
20
+ ],
21
+ "max": [
22
+ [
23
+ [
24
+ 1.0
25
+ ]
26
+ ],
27
+ [
28
+ [
29
+ 1.0
30
+ ]
31
+ ],
32
+ [
33
+ [
34
+ 1.0
35
+ ]
36
+ ]
37
+ ],
38
+ "mean": [
39
+ [
40
+ [
41
+ 0.56009308397514
42
+ ]
43
+ ],
44
+ [
45
+ [
46
+ 0.5088963212208076
47
+ ]
48
+ ],
49
+ [
50
+ [
51
+ 0.47626117961949455
52
+ ]
53
+ ]
54
+ ],
55
+ "std": [
56
+ [
57
+ [
58
+ 0.27688289864943944
59
+ ]
60
+ ],
61
+ [
62
+ [
63
+ 0.26883972589038224
64
+ ]
65
+ ],
66
+ [
67
+ [
68
+ 0.29031452356480364
69
+ ]
70
+ ]
71
+ ],
72
+ "count": [
73
+ 11006
74
+ ]
75
+ },
76
+ "episode_index": {
77
+ "min": [
78
+ 0
79
+ ],
80
+ "max": [
81
+ 128
82
+ ],
83
+ "mean": [
84
+ 63.14946338383838
85
+ ],
86
+ "std": [
87
+ 35.1467891774593
88
+ ],
89
+ "count": [
90
+ 12672
91
+ ]
92
+ },
93
+ "task_index": {
94
+ "min": [
95
+ 0
96
+ ],
97
+ "max": [
98
+ 3
99
+ ],
100
+ "mean": [
101
+ 1.6840277777777777
102
+ ],
103
+ "std": [
104
+ 1.1113384592218372
105
+ ],
106
+ "count": [
107
+ 12672
108
+ ]
109
+ },
110
+ "index": {
111
+ "min": [
112
+ 0
113
+ ],
114
+ "max": [
115
+ 12671
116
+ ],
117
+ "mean": [
118
+ 6335.5
119
+ ],
120
+ "std": [
121
+ 3658.0912941951938
122
+ ],
123
+ "count": [
124
+ 12672
125
+ ]
126
+ },
127
+ "action": {
128
+ "min": [
129
+ -0.009999999776482582,
130
+ -0.009999999776482582,
131
+ -0.009999999776482582,
132
+ -0.06283185631036758,
133
+ -0.06283185631036758,
134
+ -0.06283185631036758,
135
+ 0.0
136
+ ],
137
+ "max": [
138
+ 0.009999999776482582,
139
+ 0.009999999776482582,
140
+ 0.009999999776482582,
141
+ 0.06283185631036758,
142
+ 0.06283185631036758,
143
+ 0.06283185631036758,
144
+ 1.0
145
+ ],
146
+ "mean": [
147
+ -0.0010779668760702325,
148
+ -0.000870422678087375,
149
+ -0.0009524932320082003,
150
+ -0.00011404143052376722,
151
+ 0.001646163140721359,
152
+ 0.0006842485724881945,
153
+ 0.14094065714126566
154
+ ],
155
+ "std": [
156
+ 0.0050928476793778805,
157
+ 0.0052109778002382215,
158
+ 0.0062727072406226275,
159
+ 0.01305372613557191,
160
+ 0.014969692486291531,
161
+ 0.021519857205295197,
162
+ 0.3479603303557627
163
+ ],
164
+ "count": [
165
+ 12672
166
+ ],
167
+ "mask": [
168
+ true,
169
+ true,
170
+ true,
171
+ true,
172
+ true,
173
+ true,
174
+ false
175
+ ]
176
+ },
177
+ "timestamp": {
178
+ "min": [
179
+ 0.0
180
+ ],
181
+ "max": [
182
+ 22.5
183
+ ],
184
+ "mean": [
185
+ 5.516895517676768
186
+ ],
187
+ "std": [
188
+ 3.9518586666950704
189
+ ],
190
+ "count": [
191
+ 12672
192
+ ]
193
+ },
194
+ "frame_index": {
195
+ "min": [
196
+ 0
197
+ ],
198
+ "max": [
199
+ 225
200
+ ],
201
+ "mean": [
202
+ 55.168955176767675
203
+ ],
204
+ "std": [
205
+ 39.5185866669507
206
+ ],
207
+ "count": [
208
+ 12672
209
+ ]
210
+ },
211
+ "observation.state": {
212
+ "min": [
213
+ -0.6913691163063049,
214
+ -0.25204867124557495,
215
+ -0.22021731734275818,
216
+ -3.140528440475464,
217
+ -1.213579535484314,
218
+ -3.1340115070343018,
219
+ 0.0
220
+ ],
221
+ "max": [
222
+ -0.26134854555130005,
223
+ 0.40225377678871155,
224
+ 0.4610653519630432,
225
+ 3.1412761211395264,
226
+ 0.644866406917572,
227
+ 3.1401240825653076,
228
+ 1.0
229
+ ],
230
+ "mean": [
231
+ -0.4765559839921994,
232
+ 0.03277433536791847,
233
+ 0.01813845893630427,
234
+ 1.4840563985447381,
235
+ -0.1872646863000659,
236
+ -1.201557804914303,
237
+ 0.13328598546378098
238
+ ],
239
+ "std": [
240
+ 0.09873974979292631,
241
+ 0.12291375325367411,
242
+ 0.13182701724212956,
243
+ 2.530463134923631,
244
+ 0.39532953579234853,
245
+ 1.3639962652103377,
246
+ 0.33988356830665484
247
+ ],
248
+ "count": [
249
+ 12672
250
+ ]
251
+ }
252
+ }
253
+ ]
test-2-checkpoint-70000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f686ff77412f09b592ff0bc922f26ae973a07c61975436a5bdabb9ff32fafcfb
3
+ size 411689544
test-2-checkpoint-70000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59f2a2272118836a8d03bddc028fcb808ce0f6c44f37a58295036d62f4762404
3
+ size 47821178
test-2-checkpoint-70000/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c64adfc39ddf34bd03bc0ab6fe68d49e82a985388b71b8cc49b7dd352e5c649
3
+ size 15984
test-2-checkpoint-70000/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f36a1096cb40e95d8e84ea3862b798a484a30e0a8ebb3bb1a5220302f46fefc1
3
+ size 15984
test-2-checkpoint-70000/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a3dc9e3c833675d4bbf2c68235d5d686c8ad6d78aca11a5f66c7cbe34095e7d
3
+ size 15984
test-2-checkpoint-70000/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b9f7e37e95713161cec3e9c231443964de1539ccd68294fd825ea36ad47a221
3
+ size 15984
test-2-checkpoint-70000/rng_state_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8718aa95680fbe8fdadfe4351118c070e65b8dc3fed83cc8fb4b570b7ddf1ba
3
+ size 15984
test-2-checkpoint-70000/rng_state_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c0260060bc6534e1b1c5e10f99f29994551a1bd48df5dbeeb245dd28a1e8c76
3
+ size 15984
test-2-checkpoint-70000/rng_state_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:842f7ffed8c88ae5c3d8bab1ef96f8dbd2420347168fbd5ce91dcc72986edb3a
3
+ size 15984
test-2-checkpoint-70000/rng_state_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:429e14c738c7a7ce8edcbf2402019efcca63d340aea41a4bc93636f2c4217c8d
3
+ size 15984
test-2-checkpoint-70000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8edce61df357bb337a4d784312fba372565bd9701024f6cf892be97ef55d8d77
3
+ size 1064
test-2-checkpoint-70000/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff