nisiwaki committed on
Commit
4332033
·
verified ·
1 Parent(s): 7706ff8

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ wandb/run-20251206_005455-fytl4nqj/run-fytl4nqj.wandb filter=lfs diff=lfs merge=lfs -text
checkpoints/010000/pretrained_model/config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "type": "act",
3
+ "n_obs_steps": 1,
4
+ "input_features": {
5
+ "observation.state": {
6
+ "type": "STATE",
7
+ "shape": [
8
+ 6
9
+ ]
10
+ },
11
+ "observation.images.top": {
12
+ "type": "VISUAL",
13
+ "shape": [
14
+ 3,
15
+ 480,
16
+ 640
17
+ ]
18
+ },
19
+ "observation.images.side": {
20
+ "type": "VISUAL",
21
+ "shape": [
22
+ 3,
23
+ 480,
24
+ 640
25
+ ]
26
+ }
27
+ },
28
+ "output_features": {
29
+ "action": {
30
+ "type": "ACTION",
31
+ "shape": [
32
+ 6
33
+ ]
34
+ }
35
+ },
36
+ "device": "cuda",
37
+ "use_amp": false,
38
+ "push_to_hub": false,
39
+ "repo_id": null,
40
+ "private": null,
41
+ "tags": null,
42
+ "license": null,
43
+ "pretrained_path": null,
44
+ "chunk_size": 100,
45
+ "n_action_steps": 100,
46
+ "normalization_mapping": {
47
+ "VISUAL": "MEAN_STD",
48
+ "STATE": "MEAN_STD",
49
+ "ACTION": "MEAN_STD"
50
+ },
51
+ "vision_backbone": "resnet18",
52
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
53
+ "replace_final_stride_with_dilation": false,
54
+ "pre_norm": false,
55
+ "dim_model": 512,
56
+ "n_heads": 8,
57
+ "dim_feedforward": 3200,
58
+ "feedforward_activation": "relu",
59
+ "n_encoder_layers": 4,
60
+ "n_decoder_layers": 1,
61
+ "use_vae": true,
62
+ "latent_dim": 32,
63
+ "n_vae_encoder_layers": 4,
64
+ "temporal_ensemble_coeff": null,
65
+ "dropout": 0.1,
66
+ "kl_weight": 10.0,
67
+ "optimizer_lr": 1e-05,
68
+ "optimizer_weight_decay": 0.0001,
69
+ "optimizer_lr_backbone": 1e-05
70
+ }
checkpoints/010000/pretrained_model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8efdc98927f38b12e40e9c87d699071c1889bf4863a9a26272c21b495fdaec0d
3
+ size 206699736
checkpoints/010000/pretrained_model/policy_postprocessor.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "policy_postprocessor",
3
+ "steps": [
4
+ {
5
+ "registry_name": "unnormalizer_processor",
6
+ "config": {
7
+ "eps": 1e-08,
8
+ "features": {
9
+ "action": {
10
+ "type": "ACTION",
11
+ "shape": [
12
+ 6
13
+ ]
14
+ }
15
+ },
16
+ "norm_map": {
17
+ "VISUAL": "MEAN_STD",
18
+ "STATE": "MEAN_STD",
19
+ "ACTION": "MEAN_STD"
20
+ }
21
+ },
22
+ "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors"
23
+ },
24
+ {
25
+ "registry_name": "device_processor",
26
+ "config": {
27
+ "device": "cpu",
28
+ "float_dtype": null
29
+ }
30
+ }
31
+ ]
32
+ }
checkpoints/010000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:842dd3d16d4d2201f615433025e50510e8adec8b4c129afcf4f5314bbcdbd523
3
+ size 7520
checkpoints/010000/pretrained_model/policy_preprocessor.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "policy_preprocessor",
3
+ "steps": [
4
+ {
5
+ "registry_name": "rename_observations_processor",
6
+ "config": {
7
+ "rename_map": {}
8
+ }
9
+ },
10
+ {
11
+ "registry_name": "to_batch_processor",
12
+ "config": {}
13
+ },
14
+ {
15
+ "registry_name": "device_processor",
16
+ "config": {
17
+ "device": "cuda",
18
+ "float_dtype": null
19
+ }
20
+ },
21
+ {
22
+ "registry_name": "normalizer_processor",
23
+ "config": {
24
+ "eps": 1e-08,
25
+ "features": {
26
+ "observation.state": {
27
+ "type": "STATE",
28
+ "shape": [
29
+ 6
30
+ ]
31
+ },
32
+ "observation.images.top": {
33
+ "type": "VISUAL",
34
+ "shape": [
35
+ 3,
36
+ 480,
37
+ 640
38
+ ]
39
+ },
40
+ "observation.images.side": {
41
+ "type": "VISUAL",
42
+ "shape": [
43
+ 3,
44
+ 480,
45
+ 640
46
+ ]
47
+ },
48
+ "action": {
49
+ "type": "ACTION",
50
+ "shape": [
51
+ 6
52
+ ]
53
+ }
54
+ },
55
+ "norm_map": {
56
+ "VISUAL": "MEAN_STD",
57
+ "STATE": "MEAN_STD",
58
+ "ACTION": "MEAN_STD"
59
+ }
60
+ },
61
+ "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors"
62
+ }
63
+ ]
64
+ }
checkpoints/010000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:842dd3d16d4d2201f615433025e50510e8adec8b4c129afcf4f5314bbcdbd523
3
+ size 7520
checkpoints/010000/pretrained_model/train_config.json ADDED
@@ -0,0 +1,193 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": {
3
+ "repo_id": "AmdRamen/mission1_record_edited",
4
+ "root": null,
5
+ "episodes": null,
6
+ "image_transforms": {
7
+ "enable": false,
8
+ "max_num_transforms": 3,
9
+ "random_order": false,
10
+ "tfs": {
11
+ "brightness": {
12
+ "weight": 1.0,
13
+ "type": "ColorJitter",
14
+ "kwargs": {
15
+ "brightness": [
16
+ 0.8,
17
+ 1.2
18
+ ]
19
+ }
20
+ },
21
+ "contrast": {
22
+ "weight": 1.0,
23
+ "type": "ColorJitter",
24
+ "kwargs": {
25
+ "contrast": [
26
+ 0.8,
27
+ 1.2
28
+ ]
29
+ }
30
+ },
31
+ "saturation": {
32
+ "weight": 1.0,
33
+ "type": "ColorJitter",
34
+ "kwargs": {
35
+ "saturation": [
36
+ 0.5,
37
+ 1.5
38
+ ]
39
+ }
40
+ },
41
+ "hue": {
42
+ "weight": 1.0,
43
+ "type": "ColorJitter",
44
+ "kwargs": {
45
+ "hue": [
46
+ -0.05,
47
+ 0.05
48
+ ]
49
+ }
50
+ },
51
+ "sharpness": {
52
+ "weight": 1.0,
53
+ "type": "SharpnessJitter",
54
+ "kwargs": {
55
+ "sharpness": [
56
+ 0.5,
57
+ 1.5
58
+ ]
59
+ }
60
+ },
61
+ "affine": {
62
+ "weight": 1.0,
63
+ "type": "RandomAffine",
64
+ "kwargs": {
65
+ "degrees": [
66
+ -5.0,
67
+ 5.0
68
+ ],
69
+ "translate": [
70
+ 0.05,
71
+ 0.05
72
+ ]
73
+ }
74
+ }
75
+ }
76
+ },
77
+ "revision": null,
78
+ "use_imagenet_stats": true,
79
+ "video_backend": "torchcodec",
80
+ "streaming": false
81
+ },
82
+ "env": null,
83
+ "policy": {
84
+ "type": "act",
85
+ "n_obs_steps": 1,
86
+ "input_features": {
87
+ "observation.state": {
88
+ "type": "STATE",
89
+ "shape": [
90
+ 6
91
+ ]
92
+ },
93
+ "observation.images.top": {
94
+ "type": "VISUAL",
95
+ "shape": [
96
+ 3,
97
+ 480,
98
+ 640
99
+ ]
100
+ },
101
+ "observation.images.side": {
102
+ "type": "VISUAL",
103
+ "shape": [
104
+ 3,
105
+ 480,
106
+ 640
107
+ ]
108
+ }
109
+ },
110
+ "output_features": {
111
+ "action": {
112
+ "type": "ACTION",
113
+ "shape": [
114
+ 6
115
+ ]
116
+ }
117
+ },
118
+ "device": "cuda",
119
+ "use_amp": false,
120
+ "push_to_hub": false,
121
+ "repo_id": null,
122
+ "private": null,
123
+ "tags": null,
124
+ "license": null,
125
+ "pretrained_path": null,
126
+ "chunk_size": 100,
127
+ "n_action_steps": 100,
128
+ "normalization_mapping": {
129
+ "VISUAL": "MEAN_STD",
130
+ "STATE": "MEAN_STD",
131
+ "ACTION": "MEAN_STD"
132
+ },
133
+ "vision_backbone": "resnet18",
134
+ "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
135
+ "replace_final_stride_with_dilation": false,
136
+ "pre_norm": false,
137
+ "dim_model": 512,
138
+ "n_heads": 8,
139
+ "dim_feedforward": 3200,
140
+ "feedforward_activation": "relu",
141
+ "n_encoder_layers": 4,
142
+ "n_decoder_layers": 1,
143
+ "use_vae": true,
144
+ "latent_dim": 32,
145
+ "n_vae_encoder_layers": 4,
146
+ "temporal_ensemble_coeff": null,
147
+ "dropout": 0.1,
148
+ "kl_weight": 10.0,
149
+ "optimizer_lr": 1e-05,
150
+ "optimizer_weight_decay": 0.0001,
151
+ "optimizer_lr_backbone": 1e-05
152
+ },
153
+ "output_dir": "/workspace/outputs/train/act_mission3",
154
+ "job_name": "act_mission3",
155
+ "resume": false,
156
+ "seed": 1000,
157
+ "num_workers": 4,
158
+ "batch_size": 64,
159
+ "steps": 10000,
160
+ "eval_freq": 20000,
161
+ "log_freq": 200,
162
+ "save_checkpoint": true,
163
+ "save_freq": 20000,
164
+ "use_policy_training_preset": true,
165
+ "optimizer": {
166
+ "type": "adamw",
167
+ "lr": 1e-05,
168
+ "weight_decay": 0.0001,
169
+ "grad_clip_norm": 10.0,
170
+ "betas": [
171
+ 0.9,
172
+ 0.999
173
+ ],
174
+ "eps": 1e-08
175
+ },
176
+ "scheduler": null,
177
+ "eval": {
178
+ "n_episodes": 50,
179
+ "batch_size": 50,
180
+ "use_async_envs": false
181
+ },
182
+ "wandb": {
183
+ "enable": true,
184
+ "disable_artifact": false,
185
+ "project": "lerobot",
186
+ "entity": null,
187
+ "notes": null,
188
+ "run_id": "fytl4nqj",
189
+ "mode": null
190
+ },
191
+ "checkpoint_path": null,
192
+ "rename_map": {}
193
+ }
checkpoints/010000/training_state/optimizer_param_groups.json ADDED
@@ -0,0 +1,191 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "lr": 1e-05,
4
+ "betas": [
5
+ 0.9,
6
+ 0.999
7
+ ],
8
+ "eps": 1e-08,
9
+ "weight_decay": 0.0001,
10
+ "amsgrad": false,
11
+ "maximize": false,
12
+ "foreach": null,
13
+ "capturable": false,
14
+ "differentiable": false,
15
+ "fused": null,
16
+ "decoupled_weight_decay": true,
17
+ "params": [
18
+ 0,
19
+ 1,
20
+ 2,
21
+ 3,
22
+ 4,
23
+ 5,
24
+ 6,
25
+ 7,
26
+ 8,
27
+ 9,
28
+ 10,
29
+ 11,
30
+ 12,
31
+ 13,
32
+ 14,
33
+ 15,
34
+ 16,
35
+ 17,
36
+ 18,
37
+ 19,
38
+ 20,
39
+ 21,
40
+ 22,
41
+ 23,
42
+ 24,
43
+ 25,
44
+ 26,
45
+ 27,
46
+ 28,
47
+ 29,
48
+ 30,
49
+ 31,
50
+ 32,
51
+ 33,
52
+ 34,
53
+ 35,
54
+ 36,
55
+ 37,
56
+ 38,
57
+ 39,
58
+ 40,
59
+ 41,
60
+ 42,
61
+ 43,
62
+ 44,
63
+ 45,
64
+ 46,
65
+ 47,
66
+ 48,
67
+ 49,
68
+ 50,
69
+ 51,
70
+ 52,
71
+ 53,
72
+ 54,
73
+ 55,
74
+ 56,
75
+ 57,
76
+ 58,
77
+ 59,
78
+ 60,
79
+ 61,
80
+ 62,
81
+ 63,
82
+ 64,
83
+ 65,
84
+ 66,
85
+ 67,
86
+ 68,
87
+ 69,
88
+ 70,
89
+ 71,
90
+ 72,
91
+ 73,
92
+ 74,
93
+ 75,
94
+ 76,
95
+ 77,
96
+ 78,
97
+ 79,
98
+ 80,
99
+ 81,
100
+ 82,
101
+ 83,
102
+ 84,
103
+ 85,
104
+ 86,
105
+ 87,
106
+ 88,
107
+ 89,
108
+ 90,
109
+ 91,
110
+ 92,
111
+ 93,
112
+ 94,
113
+ 95,
114
+ 96,
115
+ 97,
116
+ 98,
117
+ 99,
118
+ 100,
119
+ 101,
120
+ 102,
121
+ 103,
122
+ 104,
123
+ 105,
124
+ 106,
125
+ 107,
126
+ 108,
127
+ 109,
128
+ 110,
129
+ 111,
130
+ 112,
131
+ 113,
132
+ 114,
133
+ 115,
134
+ 116,
135
+ 117,
136
+ 118,
137
+ 119,
138
+ 120,
139
+ 121,
140
+ 122,
141
+ 123,
142
+ 124,
143
+ 125,
144
+ 126,
145
+ 127,
146
+ 128,
147
+ 129,
148
+ 130,
149
+ 131,
150
+ 132
151
+ ]
152
+ },
153
+ {
154
+ "lr": 1e-05,
155
+ "betas": [
156
+ 0.9,
157
+ 0.999
158
+ ],
159
+ "eps": 1e-08,
160
+ "weight_decay": 0.0001,
161
+ "amsgrad": false,
162
+ "maximize": false,
163
+ "foreach": null,
164
+ "capturable": false,
165
+ "differentiable": false,
166
+ "fused": null,
167
+ "decoupled_weight_decay": true,
168
+ "params": [
169
+ 133,
170
+ 134,
171
+ 135,
172
+ 136,
173
+ 137,
174
+ 138,
175
+ 139,
176
+ 140,
177
+ 141,
178
+ 142,
179
+ 143,
180
+ 144,
181
+ 145,
182
+ 146,
183
+ 147,
184
+ 148,
185
+ 149,
186
+ 150,
187
+ 151,
188
+ 152
189
+ ]
190
+ }
191
+ ]
checkpoints/010000/training_state/optimizer_state.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:caf20d46d87f901168c7d57ef6d946cb4301adcb69f7fff50be185e049d5f03b
3
+ size 412817652
checkpoints/010000/training_state/rng_state.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af16b1f3588595c7a9092b22ae03190b728c53b4861905ecf94e7d3dec064191
3
+ size 15708
checkpoints/010000/training_state/training_step.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "step": 10000
3
+ }
wandb/debug-internal.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-12-06T00:54:56.122629742Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
2
+ {"time":"2025-12-06T00:54:56.388333444Z","level":"INFO","msg":"stream: created new stream","id":"fytl4nqj"}
3
+ {"time":"2025-12-06T00:54:56.388353266Z","level":"INFO","msg":"stream: started","id":"fytl4nqj"}
4
+ {"time":"2025-12-06T00:54:56.388365123Z","level":"INFO","msg":"writer: started","stream_id":"fytl4nqj"}
5
+ {"time":"2025-12-06T00:54:56.388376338Z","level":"INFO","msg":"handler: started","stream_id":"fytl4nqj"}
6
+ {"time":"2025-12-06T00:54:56.388405822Z","level":"INFO","msg":"sender: started","stream_id":"fytl4nqj"}
7
+ {"time":"2025-12-06T01:45:24.572319693Z","level":"INFO","msg":"stream: closing","id":"fytl4nqj"}
8
+ {"time":"2025-12-06T01:45:27.662715324Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
9
+ {"time":"2025-12-06T01:45:27.774232349Z","level":"INFO","msg":"handler: closed","stream_id":"fytl4nqj"}
10
+ {"time":"2025-12-06T01:45:27.774287536Z","level":"INFO","msg":"sender: closed","stream_id":"fytl4nqj"}
11
+ {"time":"2025-12-06T01:45:27.774298012Z","level":"INFO","msg":"stream: closed","id":"fytl4nqj"}
wandb/debug.log ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Current SDK version is 0.21.4
2
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Configure stats pid to 9366
3
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Loading settings from /root/.config/wandb/settings
4
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Loading settings from /workspace/wandb/settings
5
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:setup_run_log_directory():686] Logging user logs to /workspace/outputs/train/act_mission3/wandb/run-20251206_005455-fytl4nqj/logs/debug.log
7
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to /workspace/outputs/train/act_mission3/wandb/run-20251206_005455-fytl4nqj/logs/debug-internal.log
8
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:init():813] calling init triggers
9
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'dataset': {'repo_id': 'AmdRamen/mission1_record_edited', 'root': None, 'episodes': None, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'tfs': {'brightness': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'brightness': [0.8, 1.2]}}, 'contrast': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'contrast': [0.8, 1.2]}}, 'saturation': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'saturation': [0.5, 1.5]}}, 'hue': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'hue': [-0.05, 0.05]}}, 'sharpness': {'weight': 1.0, 'type': 'SharpnessJitter', 'kwargs': {'sharpness': [0.5, 1.5]}}, 'affine': {'weight': 1.0, 'type': 'RandomAffine', 'kwargs': {'degrees': [-5.0, 5.0], 'translate': [0.05, 0.05]}}}}, 'revision': None, 'use_imagenet_stats': True, 'video_backend': 'torchcodec', 'streaming': False}, 'env': None, 'policy': {'type': 'act', 'n_obs_steps': 1, 'input_features': {}, 'output_features': {}, 'device': 'cuda', 'use_amp': False, 'push_to_hub': False, 'repo_id': None, 'private': None, 'tags': None, 'license': None, 'pretrained_path': None, 'chunk_size': 100, 'n_action_steps': 100, 'normalization_mapping': {'VISUAL': <NormalizationMode.MEAN_STD: 'MEAN_STD'>, 'STATE': <NormalizationMode.MEAN_STD: 'MEAN_STD'>, 'ACTION': <NormalizationMode.MEAN_STD: 'MEAN_STD'>}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_coeff': None, 'dropout': 0.1, 'kl_weight': 10.0, 'optimizer_lr': 1e-05, 'optimizer_weight_decay': 0.0001, 'optimizer_lr_backbone': 1e-05}, 'output_dir': '/workspace/outputs/train/act_mission3', 'job_name': 'act_mission3', 'resume': False, 'seed': 1000, 'num_workers': 4, 'batch_size': 64, 
'steps': 10000, 'eval_freq': 20000, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 20000, 'use_policy_training_preset': True, 'optimizer': {'type': 'adamw', 'lr': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10.0, 'betas': [0.9, 0.999], 'eps': 1e-08}, 'scheduler': None, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot', 'entity': None, 'notes': None, 'run_id': None, 'mode': None}, 'checkpoint_path': None, 'rename_map': {}, '_wandb': {}}
11
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:init():854] starting backend
12
+ 2025-12-06 00:54:56,118 INFO MainThread:9366 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-12-06 00:54:56,120 INFO MainThread:9366 [wandb_init.py:init():865] backend started and connected
14
+ 2025-12-06 00:54:56,121 INFO MainThread:9366 [wandb_init.py:init():936] updated telemetry
15
+ 2025-12-06 00:54:56,121 INFO MainThread:9366 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-12-06 00:54:56,720 INFO MainThread:9366 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_console_start():2506] atexit reg
18
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_redirect():2354] redirect: wrap_raw
19
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_redirect():2423] Wrapping output streams.
20
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_redirect():2446] Redirects installed.
21
+ 2025-12-06 00:54:56,791 INFO MainThread:9366 [wandb_init.py:init():1049] run started, returning control to user process
22
+ 2025-12-06 01:45:24,572 INFO wandb-AsyncioManager-main:9366 [service_client.py:_forward_responses():84] Reached EOF.
23
+ 2025-12-06 01:45:24,572 INFO wandb-AsyncioManager-main:9366 [mailbox.py:close():137] Closing mailbox, abandoning 2 handles.
wandb/run-20251206_005455-fytl4nqj/files/config.yaml ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.21.4
4
+ e:
5
+ wqxdc1w0muy9ke859532t1lmescbho6l:
6
+ args:
7
+ - --dataset.repo_id=AmdRamen/mission1_record_edited
8
+ - --batch_size=64
9
+ - --steps=10000
10
+ - --output_dir=/workspace/outputs/train/act_mission3
11
+ - --job_name=act_mission3
12
+ - --policy.device=cuda
13
+ - --policy.type=act
14
+ - --policy.push_to_hub=false
15
+ - --wandb.enable=true
16
+ cpu_count: 160
17
+ cpu_count_logical: 160
18
+ disk:
19
+ /:
20
+ total: "2162185003008"
21
+ used: "790434836480"
22
+ executable: /opt/venv/bin/python
23
+ gpu: AMD Instinct MI300X VF
24
+ gpu_amd:
25
+ - id: "0"
26
+ maxPower: "750.0"
27
+ mclkRange: 900Mhz - 1300Mhz
28
+ model: "0x74b5"
29
+ performanceLevel: auto
30
+ sclkRange: 500Mhz - 2100Mhz
31
+ series: AMD Instinct MI300X VF
32
+ sku: M3000100
33
+ uniqueId: "0xcc07fb4719633876"
34
+ vbiosVersion: 113-M3000100-103
35
+ vendor: Advanced Micro Devices, Inc. [AMD/ATI]
36
+ gpu_count: 1
37
+ host: robotics-jupyter-launcher-4360
38
+ memory:
39
+ total: "2029207171072"
40
+ os: Linux-6.1.0-39-amd64-x86_64-with-glibc2.39
41
+ program: /opt/venv/bin/lerobot-train
42
+ python: CPython 3.12.3
43
+ root: /workspace/outputs/train/act_mission3
44
+ startedAt: "2025-12-06T00:54:55.913293Z"
45
+ writerId: wqxdc1w0muy9ke859532t1lmescbho6l
46
+ m: []
47
+ python_version: 3.12.3
48
+ t:
49
+ "1":
50
+ - 1
51
+ - 41
52
+ - 49
53
+ - 51
54
+ - 71
55
+ - 83
56
+ "2":
57
+ - 1
58
+ - 41
59
+ - 49
60
+ - 51
61
+ - 71
62
+ - 83
63
+ "3":
64
+ - 13
65
+ - 15
66
+ - 16
67
+ - 61
68
+ "4": 3.12.3
69
+ "5": 0.21.4
70
+ "10":
71
+ - 21
72
+ "12": 0.21.4
73
+ "13": linux-x86_64
74
+ batch_size:
75
+ value: 64
76
+ checkpoint_path:
77
+ value: null
78
+ dataset:
79
+ value:
80
+ episodes: null
81
+ image_transforms:
82
+ enable: false
83
+ max_num_transforms: 3
84
+ random_order: false
85
+ tfs:
86
+ affine:
87
+ kwargs:
88
+ degrees:
89
+ - -5
90
+ - 5
91
+ translate:
92
+ - 0.05
93
+ - 0.05
94
+ type: RandomAffine
95
+ weight: 1
96
+ brightness:
97
+ kwargs:
98
+ brightness:
99
+ - 0.8
100
+ - 1.2
101
+ type: ColorJitter
102
+ weight: 1
103
+ contrast:
104
+ kwargs:
105
+ contrast:
106
+ - 0.8
107
+ - 1.2
108
+ type: ColorJitter
109
+ weight: 1
110
+ hue:
111
+ kwargs:
112
+ hue:
113
+ - -0.05
114
+ - 0.05
115
+ type: ColorJitter
116
+ weight: 1
117
+ saturation:
118
+ kwargs:
119
+ saturation:
120
+ - 0.5
121
+ - 1.5
122
+ type: ColorJitter
123
+ weight: 1
124
+ sharpness:
125
+ kwargs:
126
+ sharpness:
127
+ - 0.5
128
+ - 1.5
129
+ type: SharpnessJitter
130
+ weight: 1
131
+ repo_id: AmdRamen/mission1_record_edited
132
+ revision: null
133
+ root: null
134
+ streaming: false
135
+ use_imagenet_stats: true
136
+ video_backend: torchcodec
137
+ env:
138
+ value: null
139
+ eval:
140
+ value:
141
+ batch_size: 50
142
+ n_episodes: 50
143
+ use_async_envs: false
144
+ eval_freq:
145
+ value: 20000
146
+ job_name:
147
+ value: act_mission3
148
+ log_freq:
149
+ value: 200
150
+ num_workers:
151
+ value: 4
152
+ optimizer:
153
+ value:
154
+ betas:
155
+ - 0.9
156
+ - 0.999
157
+ eps: 1e-08
158
+ grad_clip_norm: 10
159
+ lr: 1e-05
160
+ type: adamw
161
+ weight_decay: 0.0001
162
+ output_dir:
163
+ value: /workspace/outputs/train/act_mission3
164
+ policy:
165
+ value:
166
+ chunk_size: 100
167
+ device: cuda
168
+ dim_feedforward: 3200
169
+ dim_model: 512
170
+ dropout: 0.1
171
+ feedforward_activation: relu
172
+ kl_weight: 10
173
+ latent_dim: 32
174
+ license: null
175
+ n_action_steps: 100
176
+ n_decoder_layers: 1
177
+ n_encoder_layers: 4
178
+ n_heads: 8
179
+ n_obs_steps: 1
180
+ n_vae_encoder_layers: 4
181
+ normalization_mapping:
182
+ ACTION: MEAN_STD
183
+ STATE: MEAN_STD
184
+ VISUAL: MEAN_STD
185
+ optimizer_lr: 1e-05
186
+ optimizer_lr_backbone: 1e-05
187
+ optimizer_weight_decay: 0.0001
188
+ pre_norm: false
189
+ pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1
190
+ pretrained_path: null
191
+ private: null
192
+ push_to_hub: false
193
+ replace_final_stride_with_dilation: false
194
+ repo_id: null
195
+ tags: null
196
+ temporal_ensemble_coeff: null
197
+ type: act
198
+ use_amp: false
199
+ use_vae: true
200
+ vision_backbone: resnet18
201
+ resume:
202
+ value: false
203
+ save_checkpoint:
204
+ value: true
205
+ save_freq:
206
+ value: 20000
207
+ scheduler:
208
+ value: null
209
+ seed:
210
+ value: 1000
211
+ steps:
212
+ value: 10000
213
+ use_policy_training_preset:
214
+ value: true
215
+ wandb:
216
+ value:
217
+ disable_artifact: false
218
+ enable: true
219
+ entity: null
220
+ mode: null
221
+ notes: null
222
+ project: lerobot
223
+ run_id: null
wandb/run-20251206_005455-fytl4nqj/files/output.log ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ INFO 2025-12-06 00:54:56 db_utils.py:102 Logs will be synced with wandb.
2
+ INFO 2025-12-06 00:54:56 db_utils.py:103 Track this run --> https://wandb.ai/amd_hackathon_ramen/lerobot/runs/fytl4nqj
3
+ INFO 2025-12-06 00:54:56 ot_train.py:183 Creating dataset
4
+ INFO 2025-12-06 00:54:56 ot_train.py:202 Creating policy
5
+ INFO 2025-12-06 00:54:57 ot_train.py:247 Creating optimizer and scheduler
6
+ INFO 2025-12-06 00:54:57 ot_train.py:259 Output dir: /workspace/outputs/train/act_mission3
7
+ INFO 2025-12-06 00:54:57 ot_train.py:262 cfg.steps=10000 (10K)
8
+ INFO 2025-12-06 00:54:57 ot_train.py:263 dataset.num_frames=10351 (10K)
9
+ INFO 2025-12-06 00:54:57 ot_train.py:264 dataset.num_episodes=18
10
+ INFO 2025-12-06 00:54:57 ot_train.py:267 Effective batch size: 64 x 1 = 64
11
+ INFO 2025-12-06 00:54:57 ot_train.py:268 num_learnable_params=51597190 (52M)
12
+ INFO 2025-12-06 00:54:57 ot_train.py:269 num_total_params=51597190 (52M)
13
+ INFO 2025-12-06 00:54:57 ot_train.py:324 Start offline training on a fixed dataset
14
+ INFO 2025-12-06 00:57:16 ot_train.py:351 step:200 smpl:13K ep:22 epch:1.24 loss:5.418 grdn:78.522 lr:1.0e-05 updt_s:0.651 data_s:0.043
15
+ INFO 2025-12-06 00:58:13 ot_train.py:351 step:400 smpl:26K ep:45 epch:2.47 loss:2.053 grdn:34.066 lr:1.0e-05 updt_s:0.254 data_s:0.029
16
+ INFO 2025-12-06 00:59:09 ot_train.py:351 step:600 smpl:38K ep:67 epch:3.71 loss:1.573 grdn:33.456 lr:1.0e-05 updt_s:0.253 data_s:0.030
17
+ INFO 2025-12-06 01:00:07 ot_train.py:351 step:800 smpl:51K ep:89 epch:4.95 loss:1.231 grdn:28.238 lr:1.0e-05 updt_s:0.253 data_s:0.032
18
+ INFO 2025-12-06 01:01:09 ot_train.py:351 step:1K smpl:64K ep:111 epch:6.18 loss:0.968 grdn:24.788 lr:1.0e-05 updt_s:0.252 data_s:0.060
19
+ INFO 2025-12-06 01:02:06 ot_train.py:351 step:1K smpl:77K ep:134 epch:7.42 loss:0.771 grdn:23.083 lr:1.0e-05 updt_s:0.253 data_s:0.032
20
+ INFO 2025-12-06 01:03:04 ot_train.py:351 step:1K smpl:90K ep:156 epch:8.66 loss:0.610 grdn:20.872 lr:1.0e-05 updt_s:0.253 data_s:0.034
21
+ INFO 2025-12-06 01:04:01 ot_train.py:351 step:2K smpl:102K ep:178 epch:9.89 loss:0.492 grdn:19.151 lr:1.0e-05 updt_s:0.253 data_s:0.032
22
+ INFO 2025-12-06 01:05:03 ot_train.py:351 step:2K smpl:115K ep:200 epch:11.13 loss:0.400 grdn:17.442 lr:1.0e-05 updt_s:0.254 data_s:0.059
23
+ INFO 2025-12-06 01:06:00 ot_train.py:351 step:2K smpl:128K ep:223 epch:12.37 loss:0.331 grdn:15.961 lr:1.0e-05 updt_s:0.253 data_s:0.033
24
+ INFO 2025-12-06 01:06:58 ot_train.py:351 step:2K smpl:141K ep:245 epch:13.60 loss:0.281 grdn:15.139 lr:1.0e-05 updt_s:0.253 data_s:0.036
25
+ INFO 2025-12-06 01:07:56 ot_train.py:351 step:2K smpl:154K ep:267 epch:14.84 loss:0.244 grdn:13.705 lr:1.0e-05 updt_s:0.253 data_s:0.038
26
+ INFO 2025-12-06 01:09:00 ot_train.py:351 step:3K smpl:166K ep:289 epch:16.08 loss:0.216 grdn:13.436 lr:1.0e-05 updt_s:0.253 data_s:0.063
27
+ INFO 2025-12-06 01:09:57 ot_train.py:351 step:3K smpl:179K ep:312 epch:17.31 loss:0.196 grdn:12.866 lr:1.0e-05 updt_s:0.253 data_s:0.036
28
+ INFO 2025-12-06 01:10:55 ot_train.py:351 step:3K smpl:192K ep:334 epch:18.55 loss:0.179 grdn:12.783 lr:1.0e-05 updt_s:0.254 data_s:0.035
29
+ INFO 2025-12-06 01:11:53 ot_train.py:351 step:3K smpl:205K ep:356 epch:19.79 loss:0.166 grdn:11.441 lr:1.0e-05 updt_s:0.252 data_s:0.035
30
+ INFO 2025-12-06 01:12:50 ot_train.py:351 step:3K smpl:218K ep:378 epch:21.02 loss:0.155 grdn:11.232 lr:1.0e-05 updt_s:0.252 data_s:0.035
31
+ INFO 2025-12-06 01:13:52 ot_train.py:351 step:4K smpl:230K ep:401 epch:22.26 loss:0.146 grdn:11.090 lr:1.0e-05 updt_s:0.253 data_s:0.059
32
+ INFO 2025-12-06 01:14:50 ot_train.py:351 step:4K smpl:243K ep:423 epch:23.50 loss:0.137 grdn:10.513 lr:1.0e-05 updt_s:0.253 data_s:0.035
33
+ INFO 2025-12-06 01:15:48 ot_train.py:351 step:4K smpl:256K ep:445 epch:24.73 loss:0.131 grdn:10.420 lr:1.0e-05 updt_s:0.253 data_s:0.036
34
+ INFO 2025-12-06 01:16:46 ot_train.py:351 step:4K smpl:269K ep:467 epch:25.97 loss:0.125 grdn:10.228 lr:1.0e-05 updt_s:0.253 data_s:0.038
35
+ INFO 2025-12-06 01:17:50 ot_train.py:351 step:4K smpl:282K ep:490 epch:27.21 loss:0.120 grdn:10.026 lr:1.0e-05 updt_s:0.253 data_s:0.063
36
+ INFO 2025-12-06 01:18:46 ot_train.py:351 step:5K smpl:294K ep:512 epch:28.44 loss:0.114 grdn:8.895 lr:1.0e-05 updt_s:0.253 data_s:0.031
37
+ INFO 2025-12-06 01:19:44 ot_train.py:351 step:5K smpl:307K ep:534 epch:29.68 loss:0.110 grdn:9.179 lr:1.0e-05 updt_s:0.252 data_s:0.037
38
+ INFO 2025-12-06 01:20:42 ot_train.py:351 step:5K smpl:320K ep:556 epch:30.91 loss:0.107 grdn:8.854 lr:1.0e-05 updt_s:0.253 data_s:0.037
39
+ INFO 2025-12-06 01:21:46 ot_train.py:351 step:5K smpl:333K ep:579 epch:32.15 loss:0.103 grdn:8.752 lr:1.0e-05 updt_s:0.253 data_s:0.065
40
+ INFO 2025-12-06 01:22:44 ot_train.py:351 step:5K smpl:346K ep:601 epch:33.39 loss:0.100 grdn:9.187 lr:1.0e-05 updt_s:0.254 data_s:0.036
41
+ INFO 2025-12-06 01:23:42 ot_train.py:351 step:6K smpl:358K ep:623 epch:34.62 loss:0.097 grdn:8.771 lr:1.0e-05 updt_s:0.253 data_s:0.035
42
+ INFO 2025-12-06 01:24:39 ot_train.py:351 step:6K smpl:371K ep:646 epch:35.86 loss:0.094 grdn:8.387 lr:1.0e-05 updt_s:0.252 data_s:0.034
43
+ INFO 2025-12-06 01:25:42 ot_train.py:351 step:6K smpl:384K ep:668 epch:37.10 loss:0.091 grdn:8.157 lr:1.0e-05 updt_s:0.252 data_s:0.063
44
+ INFO 2025-12-06 01:26:40 ot_train.py:351 step:6K smpl:397K ep:690 epch:38.33 loss:0.089 grdn:8.513 lr:1.0e-05 updt_s:0.253 data_s:0.036
45
+ INFO 2025-12-06 01:27:38 ot_train.py:351 step:6K smpl:410K ep:712 epch:39.57 loss:0.087 grdn:7.939 lr:1.0e-05 updt_s:0.253 data_s:0.039
46
+ INFO 2025-12-06 01:28:37 ot_train.py:351 step:7K smpl:422K ep:735 epch:40.81 loss:0.085 grdn:8.116 lr:1.0e-05 updt_s:0.254 data_s:0.038
47
+ INFO 2025-12-06 01:29:34 ot_train.py:351 step:7K smpl:435K ep:757 epch:42.04 loss:0.083 grdn:7.877 lr:1.0e-05 updt_s:0.252 data_s:0.036
48
+ INFO 2025-12-06 01:30:38 ot_train.py:351 step:7K smpl:448K ep:779 epch:43.28 loss:0.082 grdn:8.333 lr:1.0e-05 updt_s:0.253 data_s:0.063
49
+ INFO 2025-12-06 01:31:36 ot_train.py:351 step:7K smpl:461K ep:801 epch:44.52 loss:0.079 grdn:7.639 lr:1.0e-05 updt_s:0.253 data_s:0.037
50
+ INFO 2025-12-06 01:32:33 ot_train.py:351 step:7K smpl:474K ep:824 epch:45.75 loss:0.077 grdn:7.156 lr:1.0e-05 updt_s:0.253 data_s:0.036
51
+ INFO 2025-12-06 01:33:32 ot_train.py:351 step:8K smpl:486K ep:846 epch:46.99 loss:0.076 grdn:7.710 lr:1.0e-05 updt_s:0.253 data_s:0.039
52
+ INFO 2025-12-06 01:34:35 ot_train.py:351 step:8K smpl:499K ep:868 epch:48.23 loss:0.074 grdn:7.208 lr:1.0e-05 updt_s:0.254 data_s:0.063
53
+ INFO 2025-12-06 01:35:32 ot_train.py:351 step:8K smpl:512K ep:890 epch:49.46 loss:0.072 grdn:7.147 lr:1.0e-05 updt_s:0.253 data_s:0.032
54
+ INFO 2025-12-06 01:36:30 ot_train.py:351 step:8K smpl:525K ep:913 epch:50.70 loss:0.072 grdn:7.424 lr:1.0e-05 updt_s:0.253 data_s:0.038
55
+ INFO 2025-12-06 01:37:29 ot_train.py:351 step:8K smpl:538K ep:935 epch:51.94 loss:0.070 grdn:6.816 lr:1.0e-05 updt_s:0.253 data_s:0.039
56
+ INFO 2025-12-06 01:38:32 ot_train.py:351 step:9K smpl:550K ep:957 epch:53.17 loss:0.068 grdn:6.631 lr:1.0e-05 updt_s:0.252 data_s:0.062
57
+ INFO 2025-12-06 01:39:29 ot_train.py:351 step:9K smpl:563K ep:979 epch:54.41 loss:0.067 grdn:6.769 lr:1.0e-05 updt_s:0.253 data_s:0.034
58
+ INFO 2025-12-06 01:40:27 ot_train.py:351 step:9K smpl:576K ep:1K epch:55.65 loss:0.067 grdn:6.859 lr:1.0e-05 updt_s:0.253 data_s:0.037
59
+ INFO 2025-12-06 01:41:25 ot_train.py:351 step:9K smpl:589K ep:1K epch:56.88 loss:0.065 grdn:6.630 lr:1.0e-05 updt_s:0.254 data_s:0.036
60
+ INFO 2025-12-06 01:42:29 ot_train.py:351 step:9K smpl:602K ep:1K epch:58.12 loss:0.064 grdn:6.299 lr:1.0e-05 updt_s:0.252 data_s:0.065
61
+ INFO 2025-12-06 01:43:26 ot_train.py:351 step:10K smpl:614K ep:1K epch:59.36 loss:0.063 grdn:6.792 lr:1.0e-05 updt_s:0.253 data_s:0.035
62
+ INFO 2025-12-06 01:44:24 ot_train.py:351 step:10K smpl:627K ep:1K epch:60.59 loss:0.062 grdn:6.748 lr:1.0e-05 updt_s:0.253 data_s:0.036
63
+ INFO 2025-12-06 01:45:22 ot_train.py:351 step:10K smpl:640K ep:1K epch:61.83 loss:0.061 grdn:6.405 lr:1.0e-05 updt_s:0.253 data_s:0.037
64
+ INFO 2025-12-06 01:45:22 ot_train.py:361 Checkpoint policy after step 10000
65
+ INFO 2025-12-06 01:45:24 ot_train.py:430 End of training
wandb/run-20251206_005455-fytl4nqj/files/requirements.txt ADDED
@@ -0,0 +1,185 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ pip==25.2
2
+ setuptools==80.9.0
3
+ zipp==3.23.0
4
+ jupyter_core==5.9.1
5
+ rpds-py==0.30.0
6
+ terminado==0.18.1
7
+ ihighlight==1.0.0
8
+ rfc3986-validator==0.1.1
9
+ pure_eval==0.2.3
10
+ ImageIO==2.37.2
11
+ dill==0.4.0
12
+ prompt_toolkit==3.0.52
13
+ httpx==0.28.1
14
+ cmake==4.1.3
15
+ jupyter-console==6.6.3
16
+ jsonschema==4.25.1
17
+ torchcodec==0.5
18
+ nbclient==0.10.2
19
+ h11==0.16.0
20
+ mistune==3.1.4
21
+ pydantic==2.12.5
22
+ jupyter_server_terminals==0.5.3
23
+ arrow==1.4.0
24
+ av==15.1.0
25
+ python-xlib==0.33
26
+ mergedeep==1.3.4
27
+ ipywidgets==8.1.8
28
+ sentry-sdk==2.47.0
29
+ matplotlib-inline==0.2.1
30
+ jupyterlab_pygments==0.3.0
31
+ toml==0.10.2
32
+ multidict==6.7.0
33
+ jupyter-lsp==2.3.0
34
+ imageio-ffmpeg==0.6.0
35
+ babel==2.17.0
36
+ typing-inspection==0.4.2
37
+ jsonschema-specifications==2025.9.1
38
+ isoduration==20.11.0
39
+ aiosignal==1.4.0
40
+ rfc3987-syntax==1.1.0
41
+ psutil==7.1.3
42
+ einops==0.8.1
43
+ argon2-cffi==25.1.0
44
+ aiohttp==3.13.2
45
+ pyyaml-include==1.4.1
46
+ nbformat==5.10.4
47
+ urllib3==2.5.0
48
+ multiprocess==0.70.16
49
+ inquirerpy==0.3.4
50
+ click==8.3.1
51
+ asttokens==3.0.1
52
+ draccus==0.10.0
53
+ ipython==9.8.0
54
+ pexpect==4.9.0
55
+ deepdiff==8.6.1
56
+ xxhash==3.6.0
57
+ rerun-sdk==0.26.2
58
+ pandocfilters==1.5.1
59
+ jedi==0.19.2
60
+ mypy_extensions==1.1.0
61
+ orderly-set==5.5.0
62
+ async-lru==2.0.5
63
+ fqdn==1.5.1
64
+ fastjsonschema==2.21.2
65
+ uri-template==1.3.0
66
+ GitPython==3.1.45
67
+ aiohappyeyeballs==2.6.1
68
+ jupyterlab==4.5.0
69
+ protobuf==6.33.1
70
+ evdev==1.9.2
71
+ anyio==4.12.0
72
+ requests==2.32.5
73
+ argon2-cffi-bindings==25.1.0
74
+ typing-inspect==0.9.0
75
+ charset-normalizer==3.4.4
76
+ webcolors==25.10.0
77
+ pyzmq==27.1.0
78
+ comm==0.2.3
79
+ notebook==7.5.0
80
+ defusedxml==0.7.1
81
+ jupyter-events==0.12.0
82
+ cloudpickle==3.1.2
83
+ propcache==0.4.1
84
+ jupyter_client==8.6.3
85
+ ptyprocess==0.7.0
86
+ widgetsnbextension==4.0.15
87
+ importlib_metadata==8.7.0
88
+ frozenlist==1.8.0
89
+ websocket-client==1.9.0
90
+ pydantic_core==2.41.5
91
+ jupyterlab_server==2.28.0
92
+ json5==0.12.1
93
+ certifi==2025.11.12
94
+ ipykernel==7.1.0
95
+ nbconvert==7.16.6
96
+ decorator==5.2.1
97
+ gymnasium==1.2.2
98
+ jupyterlab_widgets==3.0.16
99
+ notebook_shim==0.2.4
100
+ accelerate==1.12.0
101
+ pyarrow==22.0.0
102
+ regex==2025.11.3
103
+ parso==0.8.5
104
+ tinycss2==1.4.0
105
+ jupyter_server==2.17.0
106
+ debugpy==1.8.17
107
+ lark==1.3.1
108
+ annotated-types==0.7.0
109
+ idna==3.11
110
+ yarl==1.22.0
111
+ jupyter==1.1.1
112
+ diffusers==0.35.2
113
+ gitdb==4.0.12
114
+ termcolor==3.2.0
115
+ bleach==6.3.0
116
+ beautifulsoup4==4.14.3
117
+ attrs==25.4.0
118
+ pyserial==3.5
119
+ tornado==6.5.2
120
+ opencv-python-headless==4.12.0.88
121
+ rfc3339-validator==0.1.4
122
+ referencing==0.37.0
123
+ python-json-logger==4.0.0
124
+ numpy==2.2.6
125
+ pfzy==0.3.4
126
+ executing==2.2.1
127
+ smmap==5.0.2
128
+ httpcore==1.0.9
129
+ pynput==1.8.1
130
+ nest-asyncio==1.6.0
131
+ hf-xet==1.2.0
132
+ cffi==2.0.0
133
+ ipython_pygments_lexers==1.1.1
134
+ stack-data==0.6.3
135
+ wcwidth==0.2.14
136
+ jsonpointer==3.0.0
137
+ prometheus_client==0.23.1
138
+ safetensors==0.7.0
139
+ datasets==4.1.1
140
+ platformdirs==4.5.0
141
+ soupsieve==2.8
142
+ jsonlines==4.0.0
143
+ webencodings==0.5.1
144
+ Send2Trash==1.8.3
145
+ traitlets==5.14.3
146
+ huggingface-hub==0.35.3
147
+ hf_transfer==0.1.9
148
+ lerobot==0.4.1
149
+ wandb==0.21.4
150
+ pycparser==2.23
151
+ Farama-Notifications==0.0.4
152
+ Jinja2==3.1.6
153
+ iniconfig==2.1.0
154
+ apex==1.7.0a0+rocm7.0.0.git20a62dc5
155
+ matplotlib==3.10.6
156
+ tzdata==2025.2
157
+ pytorch-triton-rocm==3.3.1+rocm7.0.0.git9c7bc0a3
158
+ pyparsing==3.2.4
159
+ Pygments==2.19.2
160
+ fsspec==2025.9.0
161
+ pytest==8.4.2
162
+ cycler==0.12.1
163
+ networkx==3.5
164
+ python-dateutil==2.9.0.post0
165
+ MarkupSafe==3.0.2
166
+ six==1.17.0
167
+ pluggy==1.6.0
168
+ sympy==1.14.0
169
+ torchaudio==2.7.1+rocm7.0.0.git95c61b41
170
+ fonttools==4.60.0
171
+ packaging==25.0
172
+ tqdm==4.67.1
173
+ PyYAML==6.0.2
174
+ pillow==11.3.0
175
+ filelock==3.19.1
176
+ cxxfilt==0.3.0
177
+ contourpy==1.3.3
178
+ pytz==2025.2
179
+ typing_extensions==4.15.0
180
+ kiwisolver==1.4.9
181
+ torchvision==0.22.1+rocm7.0.0.git59a3e1f9
182
+ pandas==2.3.2
183
+ torch==2.7.1+rocm7.0.0.lw.git698b58a9
184
+ mpmath==1.3.0
185
+ lerobot==0.4.1
wandb/run-20251206_005455-fytl4nqj/files/wandb-metadata.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.1.0-39-amd64-x86_64-with-glibc2.39",
3
+ "python": "CPython 3.12.3",
4
+ "startedAt": "2025-12-06T00:54:55.913293Z",
5
+ "args": [
6
+ "--dataset.repo_id=AmdRamen/mission1_record_edited",
7
+ "--batch_size=64",
8
+ "--steps=10000",
9
+ "--output_dir=/workspace/outputs/train/act_mission3",
10
+ "--job_name=act_mission3",
11
+ "--policy.device=cuda",
12
+ "--policy.type=act",
13
+ "--policy.push_to_hub=false",
14
+ "--wandb.enable=true"
15
+ ],
16
+ "program": "/opt/venv/bin/lerobot-train",
17
+ "root": "/workspace/outputs/train/act_mission3",
18
+ "host": "robotics-jupyter-launcher-4360",
19
+ "executable": "/opt/venv/bin/python",
20
+ "cpu_count": 160,
21
+ "cpu_count_logical": 160,
22
+ "gpu": "AMD Instinct MI300X VF",
23
+ "gpu_count": 1,
24
+ "disk": {
25
+ "/": {
26
+ "total": "2162185003008",
27
+ "used": "790434836480"
28
+ }
29
+ },
30
+ "memory": {
31
+ "total": "2029207171072"
32
+ },
33
+ "gpu_amd": [
34
+ {
35
+ "id": "0",
36
+ "uniqueId": "0xcc07fb4719633876",
37
+ "vbiosVersion": "113-M3000100-103",
38
+ "performanceLevel": "auto",
39
+ "maxPower": "750.0",
40
+ "series": "AMD Instinct MI300X VF",
41
+ "model": "0x74b5",
42
+ "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]",
43
+ "sku": "M3000100",
44
+ "sclkRange": "500Mhz - 2100Mhz",
45
+ "mclkRange": "900Mhz - 1300Mhz"
46
+ }
47
+ ],
48
+ "writerId": "wqxdc1w0muy9ke859532t1lmescbho6l"
49
+ }
wandb/run-20251206_005455-fytl4nqj/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/l1_loss":0.0473325289785862,"_timestamp":1.7649855228125236e+09,"train/loss":0.06111601183190942,"train/grad_norm":6.405067704916,"_runtime":3027.850858097,"_wandb":{"runtime":3027},"train/episodes":1112.9359482175635,"train/epochs":61.82977490097575,"train/kld_loss":0.0008820029906928539,"train/dataloading_s":0.03713882846292108,"train/lr":1.0000000000000021e-05,"train/update_s":0.2526892183267046,"train/steps":10000,"train/samples":640000,"_step":10000}
wandb/run-20251206_005455-fytl4nqj/logs/debug-core.log ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-12-06T00:54:55.93081413Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpkii71jgw/port-9366.txt","pid":9366,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2025-12-06T00:54:55.931195147Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":9366}
3
+ {"time":"2025-12-06T00:54:55.931189539Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-9366-9438-2900896354/socket","Net":"unix"}}
4
+ {"time":"2025-12-06T00:54:56.11841604Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2025-12-06T00:54:56.12255009Z","level":"INFO","msg":"handleInformInit: received","streamId":"fytl4nqj","id":"1(@)"}
6
+ {"time":"2025-12-06T00:54:56.388356121Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"fytl4nqj","id":"1(@)"}
7
+ {"time":"2025-12-06T01:45:24.572267009Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2025-12-06T01:45:24.572328963Z","level":"INFO","msg":"server is shutting down"}
9
+ {"time":"2025-12-06T01:45:24.57231869Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
+ {"time":"2025-12-06T01:45:24.572421458Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-9366-9438-2900896354/socket","Net":"unix"}}
11
+ {"time":"2025-12-06T01:45:24.573067197Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
12
+ {"time":"2025-12-06T01:45:27.612086669Z","level":"ERROR","msg":"processOutgoingData: flush error","error":"write unix /tmp/wandb-9366-9438-2900896354/socket->@: use of closed network connection","id":"1(@)"}
13
+ {"time":"2025-12-06T01:45:27.77560418Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
14
+ {"time":"2025-12-06T01:45:27.775619049Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
15
+ {"time":"2025-12-06T01:45:27.775628326Z","level":"INFO","msg":"server is closed"}
wandb/run-20251206_005455-fytl4nqj/logs/debug-internal.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2025-12-06T00:54:56.122629742Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"}
2
+ {"time":"2025-12-06T00:54:56.388333444Z","level":"INFO","msg":"stream: created new stream","id":"fytl4nqj"}
3
+ {"time":"2025-12-06T00:54:56.388353266Z","level":"INFO","msg":"stream: started","id":"fytl4nqj"}
4
+ {"time":"2025-12-06T00:54:56.388365123Z","level":"INFO","msg":"writer: started","stream_id":"fytl4nqj"}
5
+ {"time":"2025-12-06T00:54:56.388376338Z","level":"INFO","msg":"handler: started","stream_id":"fytl4nqj"}
6
+ {"time":"2025-12-06T00:54:56.388405822Z","level":"INFO","msg":"sender: started","stream_id":"fytl4nqj"}
7
+ {"time":"2025-12-06T01:45:24.572319693Z","level":"INFO","msg":"stream: closing","id":"fytl4nqj"}
8
+ {"time":"2025-12-06T01:45:27.662715324Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
9
+ {"time":"2025-12-06T01:45:27.774232349Z","level":"INFO","msg":"handler: closed","stream_id":"fytl4nqj"}
10
+ {"time":"2025-12-06T01:45:27.774287536Z","level":"INFO","msg":"sender: closed","stream_id":"fytl4nqj"}
11
+ {"time":"2025-12-06T01:45:27.774298012Z","level":"INFO","msg":"stream: closed","id":"fytl4nqj"}
wandb/run-20251206_005455-fytl4nqj/logs/debug.log ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Current SDK version is 0.21.4
2
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Configure stats pid to 9366
3
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Loading settings from /root/.config/wandb/settings
4
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Loading settings from /workspace/wandb/settings
5
+ 2025-12-06 00:54:55,913 INFO MainThread:9366 [wandb_setup.py:_flush():81] Loading settings from environment variables
6
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:setup_run_log_directory():686] Logging user logs to /workspace/outputs/train/act_mission3/wandb/run-20251206_005455-fytl4nqj/logs/debug.log
7
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:setup_run_log_directory():687] Logging internal logs to /workspace/outputs/train/act_mission3/wandb/run-20251206_005455-fytl4nqj/logs/debug-internal.log
8
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:init():813] calling init triggers
9
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:init():818] wandb.init called with sweep_config: {}
10
+ config: {'dataset': {'repo_id': 'AmdRamen/mission1_record_edited', 'root': None, 'episodes': None, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'tfs': {'brightness': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'brightness': [0.8, 1.2]}}, 'contrast': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'contrast': [0.8, 1.2]}}, 'saturation': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'saturation': [0.5, 1.5]}}, 'hue': {'weight': 1.0, 'type': 'ColorJitter', 'kwargs': {'hue': [-0.05, 0.05]}}, 'sharpness': {'weight': 1.0, 'type': 'SharpnessJitter', 'kwargs': {'sharpness': [0.5, 1.5]}}, 'affine': {'weight': 1.0, 'type': 'RandomAffine', 'kwargs': {'degrees': [-5.0, 5.0], 'translate': [0.05, 0.05]}}}}, 'revision': None, 'use_imagenet_stats': True, 'video_backend': 'torchcodec', 'streaming': False}, 'env': None, 'policy': {'type': 'act', 'n_obs_steps': 1, 'input_features': {}, 'output_features': {}, 'device': 'cuda', 'use_amp': False, 'push_to_hub': False, 'repo_id': None, 'private': None, 'tags': None, 'license': None, 'pretrained_path': None, 'chunk_size': 100, 'n_action_steps': 100, 'normalization_mapping': {'VISUAL': <NormalizationMode.MEAN_STD: 'MEAN_STD'>, 'STATE': <NormalizationMode.MEAN_STD: 'MEAN_STD'>, 'ACTION': <NormalizationMode.MEAN_STD: 'MEAN_STD'>}, 'vision_backbone': 'resnet18', 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'replace_final_stride_with_dilation': False, 'pre_norm': False, 'dim_model': 512, 'n_heads': 8, 'dim_feedforward': 3200, 'feedforward_activation': 'relu', 'n_encoder_layers': 4, 'n_decoder_layers': 1, 'use_vae': True, 'latent_dim': 32, 'n_vae_encoder_layers': 4, 'temporal_ensemble_coeff': None, 'dropout': 0.1, 'kl_weight': 10.0, 'optimizer_lr': 1e-05, 'optimizer_weight_decay': 0.0001, 'optimizer_lr_backbone': 1e-05}, 'output_dir': '/workspace/outputs/train/act_mission3', 'job_name': 'act_mission3', 'resume': False, 'seed': 1000, 'num_workers': 4, 'batch_size': 64, 
'steps': 10000, 'eval_freq': 20000, 'log_freq': 200, 'save_checkpoint': True, 'save_freq': 20000, 'use_policy_training_preset': True, 'optimizer': {'type': 'adamw', 'lr': 1e-05, 'weight_decay': 0.0001, 'grad_clip_norm': 10.0, 'betas': [0.9, 0.999], 'eps': 1e-08}, 'scheduler': None, 'eval': {'n_episodes': 50, 'batch_size': 50, 'use_async_envs': False}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot', 'entity': None, 'notes': None, 'run_id': None, 'mode': None}, 'checkpoint_path': None, 'rename_map': {}, '_wandb': {}}
11
+ 2025-12-06 00:54:55,914 INFO MainThread:9366 [wandb_init.py:init():854] starting backend
12
+ 2025-12-06 00:54:56,118 INFO MainThread:9366 [wandb_init.py:init():857] sending inform_init request
13
+ 2025-12-06 00:54:56,120 INFO MainThread:9366 [wandb_init.py:init():865] backend started and connected
14
+ 2025-12-06 00:54:56,121 INFO MainThread:9366 [wandb_init.py:init():936] updated telemetry
15
+ 2025-12-06 00:54:56,121 INFO MainThread:9366 [wandb_init.py:init():960] communicating run to backend with 90.0 second timeout
16
+ 2025-12-06 00:54:56,720 INFO MainThread:9366 [wandb_init.py:init():1011] starting run threads in backend
17
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_console_start():2506] atexit reg
18
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_redirect():2354] redirect: wrap_raw
19
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_redirect():2423] Wrapping output streams.
20
+ 2025-12-06 00:54:56,790 INFO MainThread:9366 [wandb_run.py:_redirect():2446] Redirects installed.
21
+ 2025-12-06 00:54:56,791 INFO MainThread:9366 [wandb_init.py:init():1049] run started, returning control to user process
22
+ 2025-12-06 01:45:24,572 INFO wandb-AsyncioManager-main:9366 [service_client.py:_forward_responses():84] Reached EOF.
23
+ 2025-12-06 01:45:24,572 INFO wandb-AsyncioManager-main:9366 [mailbox.py:close():137] Closing mailbox, abandoning 2 handles.
wandb/run-20251206_005455-fytl4nqj/run-fytl4nqj.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:898e7b7ef010af586c96184d609d2e00a225bc66a82d5c68c7f0d83d8b4441d9
3
+ size 207150