bearlover365 committed on
Commit
f1e98f9
·
verified ·
1 Parent(s): 1e0d03b

Upload full checkpoint 200000

Browse files
pretrained_model/config.json ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "type": "act",
3
+ "n_obs_steps": 1,
4
+ "normalization_mapping": {
5
+ "VISUAL": "MEAN_STD",
6
+ "STATE": "MEAN_STD",
7
+ "ACTION": "MEAN_STD"
8
+ },
9
+ "input_features": {
10
+ "observation.state": {
11
+ "type": "STATE",
12
+ "shape": [
13
+ 6
14
+ ]
15
+ },
16
+ "observation.images.wrist": {
17
+ "type": "VISUAL",
18
+ "shape": [
19
+ 3,
20
+ 480,
21
+ 640
22
+ ]
23
+ }
24
+ },
25
+ "output_features": {
26
+ "action": {
27
+ "type": "ACTION",
28
+ "shape": [
29
+ 6
30
+ ]
31
+ }
32
+ },
33
+ "device": "cuda",
34
+ "use_amp": false,
35
+ "push_to_hub": true,
36
+ "repo_id": "bearlover365/d4_dataset_only_2_validation_episodes",
37
+ "private": null,
38
+ "tags": null,
39
+ "license": null,
40
+ "chunk_size": 100,
41
+ "n_action_steps": 100,
42
+ "vision_backbone": "resnet18",
43
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
44
+ "replace_final_stride_with_dilation": 0,
45
+ "pre_norm": false,
46
+ "dim_model": 512,
47
+ "n_heads": 8,
48
+ "dim_feedforward": 3200,
49
+ "feedforward_activation": "relu",
50
+ "n_encoder_layers": 4,
51
+ "n_decoder_layers": 1,
52
+ "use_vae": true,
53
+ "latent_dim": 32,
54
+ "n_vae_encoder_layers": 4,
55
+ "temporal_ensemble_coeff": null,
56
+ "dropout": 0.1,
57
+ "kl_weight": 10.0,
58
+ "optimizer_lr": 1e-05,
59
+ "optimizer_weight_decay": 0.0001,
60
+ "optimizer_lr_backbone": 1e-05
61
+ }
pretrained_model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5308429a30ea90f02206cfded10bdda6cbd7e4d4f6db359d42db7af3f4d7ed9d
3
+ size 206700792
pretrained_model/train_config.json ADDED
@@ -0,0 +1,174 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": {
3
+ "repo_id": "bearlover365/pick_place_up_to_four_white_socks_varying_daylight_intensity_train",
4
+ "root": null,
5
+ "episodes": null,
6
+ "val_episodes": [
7
+ 0,
8
+ 1
9
+ ],
10
+ "val_repo_id": "bearlover365/pick_place_up_to_four_white_socks_varying_daylight_intensity_validation_episode_0_and_72",
11
+ "image_transforms": {
12
+ "enable": false,
13
+ "max_num_transforms": 3,
14
+ "random_order": false,
15
+ "tfs": {
16
+ "brightness": {
17
+ "weight": 1.0,
18
+ "type": "ColorJitter",
19
+ "kwargs": {
20
+ "brightness": [
21
+ 0.8,
22
+ 1.2
23
+ ]
24
+ }
25
+ },
26
+ "contrast": {
27
+ "weight": 1.0,
28
+ "type": "ColorJitter",
29
+ "kwargs": {
30
+ "contrast": [
31
+ 0.8,
32
+ 1.2
33
+ ]
34
+ }
35
+ },
36
+ "saturation": {
37
+ "weight": 1.0,
38
+ "type": "ColorJitter",
39
+ "kwargs": {
40
+ "saturation": [
41
+ 0.5,
42
+ 1.5
43
+ ]
44
+ }
45
+ },
46
+ "hue": {
47
+ "weight": 1.0,
48
+ "type": "ColorJitter",
49
+ "kwargs": {
50
+ "hue": [
51
+ -0.05,
52
+ 0.05
53
+ ]
54
+ }
55
+ },
56
+ "sharpness": {
57
+ "weight": 1.0,
58
+ "type": "SharpnessJitter",
59
+ "kwargs": {
60
+ "sharpness": [
61
+ 0.5,
62
+ 1.5
63
+ ]
64
+ }
65
+ }
66
+ }
67
+ },
68
+ "revision": null,
69
+ "use_imagenet_stats": true,
70
+ "video_backend": "pyav"
71
+ },
72
+ "env": null,
73
+ "policy": {
74
+ "type": "act",
75
+ "n_obs_steps": 1,
76
+ "normalization_mapping": {
77
+ "VISUAL": "MEAN_STD",
78
+ "STATE": "MEAN_STD",
79
+ "ACTION": "MEAN_STD"
80
+ },
81
+ "input_features": {
82
+ "observation.state": {
83
+ "type": "STATE",
84
+ "shape": [
85
+ 6
86
+ ]
87
+ },
88
+ "observation.images.wrist": {
89
+ "type": "VISUAL",
90
+ "shape": [
91
+ 3,
92
+ 480,
93
+ 640
94
+ ]
95
+ }
96
+ },
97
+ "output_features": {
98
+ "action": {
99
+ "type": "ACTION",
100
+ "shape": [
101
+ 6
102
+ ]
103
+ }
104
+ },
105
+ "device": "cuda",
106
+ "use_amp": false,
107
+ "push_to_hub": true,
108
+ "repo_id": "bearlover365/d4_dataset_only_2_validation_episodes",
109
+ "private": null,
110
+ "tags": null,
111
+ "license": null,
112
+ "chunk_size": 100,
113
+ "n_action_steps": 100,
114
+ "vision_backbone": "resnet18",
115
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
116
+ "replace_final_stride_with_dilation": 0,
117
+ "pre_norm": false,
118
+ "dim_model": 512,
119
+ "n_heads": 8,
120
+ "dim_feedforward": 3200,
121
+ "feedforward_activation": "relu",
122
+ "n_encoder_layers": 4,
123
+ "n_decoder_layers": 1,
124
+ "use_vae": true,
125
+ "latent_dim": 32,
126
+ "n_vae_encoder_layers": 4,
127
+ "temporal_ensemble_coeff": null,
128
+ "dropout": 0.1,
129
+ "kl_weight": 10.0,
130
+ "optimizer_lr": 1e-05,
131
+ "optimizer_weight_decay": 0.0001,
132
+ "optimizer_lr_backbone": 1e-05
133
+ },
134
+ "output_dir": "/teamspace/studios/this_studio/lerobot/outputs/train/d4_dataset_only_2_validation_episodes/checkpoints",
135
+ "job_name": "d4_dataset_only_2_validation_episodes_checkpoint_25k_300k_steps_20250823_174025_bs8_lr1.0e-05_bblr1.0e-05_smp4000000_bs8_lr1.0e-05_bblr1.0e-05_smp4000000",
136
+ "resume": true,
137
+ "seed": 1000,
138
+ "num_workers": 4,
139
+ "batch_size": 8,
140
+ "steps": 500000,
141
+ "target_samples": null,
142
+ "eval_freq": 5000,
143
+ "log_freq": 200,
144
+ "save_checkpoint": true,
145
+ "save_freq": 50000,
146
+ "use_policy_training_preset": true,
147
+ "optimizer": {
148
+ "type": "adamw",
149
+ "lr": 1e-05,
150
+ "weight_decay": 0.0001,
151
+ "grad_clip_norm": 10.0,
152
+ "betas": [
153
+ 0.9,
154
+ 0.999
155
+ ],
156
+ "eps": 1e-08
157
+ },
158
+ "scheduler": null,
159
+ "eval": {
160
+ "n_episodes": 50,
161
+ "batch_size": 50,
162
+ "use_async_envs": false
163
+ },
164
+ "initial_step": 0,
165
+ "wandb": {
166
+ "enable": true,
167
+ "disable_artifact": false,
168
+ "project": "lerobot",
169
+ "entity": "benfduffy-bearcover-gmbh",
170
+ "notes": null,
171
+ "run_id": "ms2tqgeo",
172
+ "mode": null
173
+ }
174
+ }
training_state/optimizer_param_groups.json ADDED
@@ -0,0 +1,191 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "lr": 1e-05,
4
+ "betas": [
5
+ 0.9,
6
+ 0.999
7
+ ],
8
+ "eps": 1e-08,
9
+ "weight_decay": 0.0001,
10
+ "amsgrad": false,
11
+ "maximize": false,
12
+ "foreach": null,
13
+ "capturable": false,
14
+ "differentiable": false,
15
+ "fused": null,
16
+ "decoupled_weight_decay": true,
17
+ "params": [
18
+ 0,
19
+ 1,
20
+ 2,
21
+ 3,
22
+ 4,
23
+ 5,
24
+ 6,
25
+ 7,
26
+ 8,
27
+ 9,
28
+ 10,
29
+ 11,
30
+ 12,
31
+ 13,
32
+ 14,
33
+ 15,
34
+ 16,
35
+ 17,
36
+ 18,
37
+ 19,
38
+ 20,
39
+ 21,
40
+ 22,
41
+ 23,
42
+ 24,
43
+ 25,
44
+ 26,
45
+ 27,
46
+ 28,
47
+ 29,
48
+ 30,
49
+ 31,
50
+ 32,
51
+ 33,
52
+ 34,
53
+ 35,
54
+ 36,
55
+ 37,
56
+ 38,
57
+ 39,
58
+ 40,
59
+ 41,
60
+ 42,
61
+ 43,
62
+ 44,
63
+ 45,
64
+ 46,
65
+ 47,
66
+ 48,
67
+ 49,
68
+ 50,
69
+ 51,
70
+ 52,
71
+ 53,
72
+ 54,
73
+ 55,
74
+ 56,
75
+ 57,
76
+ 58,
77
+ 59,
78
+ 60,
79
+ 61,
80
+ 62,
81
+ 63,
82
+ 64,
83
+ 65,
84
+ 66,
85
+ 67,
86
+ 68,
87
+ 69,
88
+ 70,
89
+ 71,
90
+ 72,
91
+ 73,
92
+ 74,
93
+ 75,
94
+ 76,
95
+ 77,
96
+ 78,
97
+ 79,
98
+ 80,
99
+ 81,
100
+ 82,
101
+ 83,
102
+ 84,
103
+ 85,
104
+ 86,
105
+ 87,
106
+ 88,
107
+ 89,
108
+ 90,
109
+ 91,
110
+ 92,
111
+ 93,
112
+ 94,
113
+ 95,
114
+ 96,
115
+ 97,
116
+ 98,
117
+ 99,
118
+ 100,
119
+ 101,
120
+ 102,
121
+ 103,
122
+ 104,
123
+ 105,
124
+ 106,
125
+ 107,
126
+ 108,
127
+ 109,
128
+ 110,
129
+ 111,
130
+ 112,
131
+ 113,
132
+ 114,
133
+ 115,
134
+ 116,
135
+ 117,
136
+ 118,
137
+ 119,
138
+ 120,
139
+ 121,
140
+ 122,
141
+ 123,
142
+ 124,
143
+ 125,
144
+ 126,
145
+ 127,
146
+ 128,
147
+ 129,
148
+ 130,
149
+ 131,
150
+ 132
151
+ ]
152
+ },
153
+ {
154
+ "lr": 1e-05,
155
+ "betas": [
156
+ 0.9,
157
+ 0.999
158
+ ],
159
+ "eps": 1e-08,
160
+ "weight_decay": 0.0001,
161
+ "amsgrad": false,
162
+ "maximize": false,
163
+ "foreach": null,
164
+ "capturable": false,
165
+ "differentiable": false,
166
+ "fused": null,
167
+ "decoupled_weight_decay": true,
168
+ "params": [
169
+ 133,
170
+ 134,
171
+ 135,
172
+ 136,
173
+ 137,
174
+ 138,
175
+ 139,
176
+ 140,
177
+ 141,
178
+ 142,
179
+ 143,
180
+ 144,
181
+ 145,
182
+ 146,
183
+ 147,
184
+ 148,
185
+ 149,
186
+ 150,
187
+ 151,
188
+ 152
189
+ ]
190
+ }
191
+ ]
training_state/optimizer_state.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e17315c24e828e72baa561fd203efbec077ba345631c50d655952a1ab00fa681
3
+ size 412817652
training_state/rng_state.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3f34babfa64754fcb4fd133bce2418b83fe9c39916c1bd559c39876cb336473
3
+ size 15708
training_state/training_step.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "step": 200000
3
+ }