lookas committed on
Commit
9e97b8e
·
verified ·
1 Parent(s): d31786f

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +4 -0
  2. .gitignore +1 -0
  3. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/config.yaml +71 -0
  4. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/dataset_statistics.json +264 -0
  5. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/run_qwen3vl_bridge_rt1_qwen_gr00t.sh +62 -0
  6. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/summary.jsonl +4 -0
  7. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug-internal.log +18 -0
  8. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug.log +0 -0
  9. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/output.log +0 -0
  10. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/requirements.txt +190 -0
  11. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/wandb-metadata.json +122 -0
  12. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug-internal.log +18 -0
  13. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug.log +0 -0
  14. qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/run-xgfaxrjd.wandb +3 -0
  15. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/config.yaml +71 -0
  16. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/dataset_statistics.json +264 -0
  17. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/run_qwen3vl_bridge_rt1_qwen_gr00t.sh +62 -0
  18. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/summary.jsonl +10 -0
  19. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug-internal.log +89 -0
  20. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug.log +0 -0
  21. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/config.yaml +133 -0
  22. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/output.log +0 -0
  23. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/requirements.txt +190 -0
  24. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-metadata.json +122 -0
  25. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-summary.json +1 -0
  26. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug-internal.log +89 -0
  27. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug.log +0 -0
  28. qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/run-xbap43rk.wandb +3 -0
  29. qwen3vl_bridge_rt1_QwenOFT_0112_1323/config.yaml +51 -0
  30. qwen3vl_bridge_rt1_QwenOFT_0112_1323/dataset_statistics.json +264 -0
  31. qwen3vl_bridge_rt1_QwenOFT_0112_1323/run_qwen3vl_bridge_rt1_qwen_oft.sh +62 -0
  32. qwen3vl_bridge_rt1_QwenOFT_0112_1323/summary.jsonl +10 -0
  33. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug-internal.log +78 -0
  34. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug.log +0 -0
  35. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/config.yaml +133 -0
  36. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/output.log +0 -0
  37. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/requirements.txt +190 -0
  38. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-metadata.json +122 -0
  39. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-summary.json +1 -0
  40. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug-internal.log +78 -0
  41. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug.log +0 -0
  42. qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/run-ueywjhk5.wandb +3 -0
  43. qwen3vl_bridge_rt1_QwenOFT_0117_1748/config.yaml +51 -0
  44. qwen3vl_bridge_rt1_QwenOFT_0117_1748/dataset_statistics.json +264 -0
  45. qwen3vl_bridge_rt1_QwenOFT_0117_1748/run_qwen3vl_bridge_rt1_qwen_oft.sh +62 -0
  46. qwen3vl_bridge_rt1_QwenOFT_0117_1748/summary.jsonl +10 -0
  47. qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug-internal.log +25 -0
  48. qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug.log +0 -0
  49. qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/config.yaml +133 -0
  50. qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/output.log +0 -0
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/run-xgfaxrjd.wandb filter=lfs diff=lfs merge=lfs -text
37
+ qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/run-xbap43rk.wandb filter=lfs diff=lfs merge=lfs -text
38
+ qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/run-ueywjhk5.wandb filter=lfs diff=lfs merge=lfs -text
39
+ qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/run-rqrn3qyr.wandb filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ wandb
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/config.yaml ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
4
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
5
+ data_mix: bridge_rt_1
6
+ data_root_dir: ./playground/Datasets/OXE_LEROBOT
7
+ dataset_py: lerobot_datasets
8
+ image_size:
9
+ - 224
10
+ - 224
11
+ per_device_batch_size: 8
12
+ video_backend: torchvision_av
13
+ framework:
14
+ action_model:
15
+ action_dim: 7
16
+ action_horizon: 16
17
+ action_model_type: DiT-B
18
+ add_pos_embed: true
19
+ diffusion_model_cfg:
20
+ cross_attention_dim: 4096
21
+ dropout: 0.2
22
+ final_dropout: true
23
+ interleave_self_attention: true
24
+ norm_type: ada_norm
25
+ num_layers: 16
26
+ output_dim: 1024
27
+ positional_embeddings: null
28
+ future_action_window_size: 15
29
+ hidden_size: 1024
30
+ max_seq_len: 1024
31
+ noise_beta_alpha: 1.5
32
+ noise_beta_beta: 1.0
33
+ noise_s: 0.999
34
+ num_inference_timesteps: 4
35
+ num_target_vision_tokens: 32
36
+ num_timestep_buckets: 1000
37
+ past_action_window_size: 0
38
+ state_dim: 7
39
+ name: QwenGR00T
40
+ qwenvl:
41
+ base_vlm: /home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
42
+ output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0112_1323
43
+ run_id: qwen3vl_bridge_rt1_QwenGR00T_0112_1323
44
+ run_root_dir: ./Checkpoints
45
+ seed: 42
46
+ trainer:
47
+ eval_interval: 200
48
+ freeze_modules: true
49
+ gradient_accumulation_steps: 1
50
+ gradient_clipping: 1.0
51
+ is_resume: false
52
+ learning_rate:
53
+ action_model: 0.0001
54
+ base: 1.0e-05
55
+ qwen_vl_interface: 1.0e-05
56
+ logging_frequency: 50
57
+ lr_scheduler_type: cosine_with_min_lr
58
+ max_train_steps: 100000
59
+ num_warmup_steps: 10000
60
+ optimizer:
61
+ betas:
62
+ - 0.9
63
+ - 0.95
64
+ eps: 1.0e-08
65
+ weight_decay: 1.0e-08
66
+ repeated_diffusion_steps: 4
67
+ save_interval: 10000
68
+ scheduler_specific_kwargs:
69
+ min_lr: 5.0e-07
70
+ wandb_entity: lookas
71
+ wandb_project: Qwen3VL_Bridge_RT1_GR00T
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/dataset_statistics.json ADDED
@@ -0,0 +1,264 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "oxe_bridge": {
3
+ "action": {
4
+ "mean": [
5
+ 0.00011365935642970726,
6
+ 6.556110747624189e-05,
7
+ -6.320965621853247e-05,
8
+ -7.205353176686913e-05,
9
+ -0.00019515302847139537,
10
+ 0.0001203166029881686,
11
+ 0.28829458355903625
12
+ ],
13
+ "std": [
14
+ 0.006909770731857718,
15
+ 0.009684093232852218,
16
+ 0.00896290498528129,
17
+ 0.020121052930683073,
18
+ 0.021582655517295487,
19
+ 0.054723342223346974,
20
+ 0.4543627821514982
21
+ ],
22
+ "max": [
23
+ 0.41691166162490845,
24
+ 0.25864794850349426,
25
+ 0.21218234300613403,
26
+ 3.122201919555664,
27
+ 1.8618112802505493,
28
+ 6.272472858428955,
29
+ 1.0
30
+ ],
31
+ "min": [
32
+ -0.4007510244846344,
33
+ -0.13874775171279907,
34
+ -0.22553899884223938,
35
+ -3.2010786533355713,
36
+ -1.8618112802505493,
37
+ -6.279075622558594,
38
+ 0.0
39
+ ],
40
+ "q01": [
41
+ -0.02875255048274994,
42
+ -0.04170213546603918,
43
+ -0.026096721179783344,
44
+ -0.08052874729037285,
45
+ -0.09249906800687313,
46
+ -0.20738555490970612,
47
+ 0.0
48
+ ],
49
+ "q99": [
50
+ 0.028306663036346436,
51
+ 0.04089853074401617,
52
+ 0.0401805154979229,
53
+ 0.08173403143882751,
54
+ 0.07760760560631752,
55
+ 0.2038465365767479,
56
+ 1.0
57
+ ],
58
+ "mask": [
59
+ true,
60
+ true,
61
+ true,
62
+ true,
63
+ true,
64
+ true,
65
+ false
66
+ ]
67
+ },
68
+ "state": {
69
+ "mean": [
70
+ 0.15471743047237396,
71
+ 0.015362550504505634,
72
+ 0.03222028166055679,
73
+ 0.0032453201711177826,
74
+ -0.038600146770477295,
75
+ 0.05382946878671646,
76
+ 0.0,
77
+ 0.35406652092933655
78
+ ],
79
+ "std": [
80
+ 0.1605359274864927,
81
+ 0.06677912092232112,
82
+ 0.048657150951527554,
83
+ 0.09275336958940797,
84
+ 0.12566984746914736,
85
+ 0.41222738578801793,
86
+ 0.0,
87
+ 0.4330223535305803
88
+ ],
89
+ "max": [
90
+ 0.5862360596656799,
91
+ 0.4034728705883026,
92
+ 0.3568263053894043,
93
+ 1.3517684936523438,
94
+ 1.570796251296997,
95
+ 3.141204357147217,
96
+ 0.0,
97
+ 1.1121242046356201
98
+ ],
99
+ "min": [
100
+ -0.04167502000927925,
101
+ -0.3563207685947418,
102
+ -0.15537554025650024,
103
+ -3.141592502593994,
104
+ -1.4992541074752808,
105
+ -3.14153790473938,
106
+ 0.0,
107
+ 0.04637829214334488
108
+ ],
109
+ "q01": [
110
+ 0.17102622985839844,
111
+ -0.1698118858039379,
112
+ -0.055632163770496845,
113
+ -0.36493172496557236,
114
+ -0.541871190071106,
115
+ -1.354275494813919,
116
+ 0.0,
117
+ 0.052190229296684265
118
+ ],
119
+ "q99": [
120
+ 0.45322076976299286,
121
+ 0.2354845181107521,
122
+ 0.19489620998501778,
123
+ 0.3780156075954437,
124
+ 0.27568644285202026,
125
+ 1.8500566184520721,
126
+ 0.0,
127
+ 1.0105689764022827
128
+ ]
129
+ },
130
+ "num_transitions": 1305714,
131
+ "num_trajectories": 53192
132
+ },
133
+ "oxe_rt1": {
134
+ "action": {
135
+ "mean": [
136
+ 0.003493750700727105,
137
+ 0.003132961690425873,
138
+ -0.0063125672750175,
139
+ 0.02166595682501793,
140
+ -0.0028780836146324873,
141
+ 0.0004565489653032273,
142
+ 0.26771023869514465
143
+ ],
144
+ "std": [
145
+ 0.049065014465362655,
146
+ 0.04229853739828572,
147
+ 0.05237628880142378,
148
+ 0.1124860236500875,
149
+ 0.09312952783816872,
150
+ 0.10319098309601091,
151
+ 0.4418448662622395
152
+ ],
153
+ "max": [
154
+ 2.9984593391418457,
155
+ 22.09052848815918,
156
+ 2.7507524490356445,
157
+ 1.570636510848999,
158
+ 1.5321086645126343,
159
+ 1.5691522359848022,
160
+ 1.0
161
+ ],
162
+ "min": [
163
+ -2.0204520225524902,
164
+ -5.497899532318115,
165
+ -2.031663417816162,
166
+ -1.569917917251587,
167
+ -1.569892168045044,
168
+ -1.570419430732727,
169
+ 0.0
170
+ ],
171
+ "q01": [
172
+ -0.22453527510166169,
173
+ -0.14820013284683228,
174
+ -0.231589707583189,
175
+ -0.3517994859814644,
176
+ -0.4193011274933815,
177
+ -0.43643461108207704,
178
+ 0.0
179
+ ],
180
+ "q99": [
181
+ 0.17824687153100965,
182
+ 0.14938379630446405,
183
+ 0.21842354819178575,
184
+ 0.5892666035890578,
185
+ 0.35272657424211445,
186
+ 0.44796681255102094,
187
+ 1.0
188
+ ],
189
+ "mask": [
190
+ true,
191
+ true,
192
+ true,
193
+ true,
194
+ true,
195
+ true,
196
+ false
197
+ ]
198
+ },
199
+ "state": {
200
+ "mean": [
201
+ 0.2799473702907562,
202
+ -0.04167069122195244,
203
+ 0.38854750990867615,
204
+ 0.21306729316711426,
205
+ -0.12402277439832687,
206
+ 0.24756911396980286,
207
+ 0.046330634504556656,
208
+ 0.10487449914216995
209
+ ],
210
+ "std": [
211
+ 0.29342642876909925,
212
+ 0.09174024655686211,
213
+ 0.42569508885539115,
214
+ 0.38616252611341306,
215
+ 0.38314586427420927,
216
+ 0.44433568806919804,
217
+ 0.1263927443679382,
218
+ 0.22122596673781084
219
+ ],
220
+ "max": [
221
+ 1.0534898042678833,
222
+ 0.48018959164619446,
223
+ 1.6896663904190063,
224
+ 1.0,
225
+ 0.9999993443489075,
226
+ 0.9999874830245972,
227
+ 0.9554369449615479,
228
+ 0.9914546012878418
229
+ ],
230
+ "min": [
231
+ -0.4436439275741577,
232
+ -0.9970501065254211,
233
+ -0.006579156965017319,
234
+ 0.0,
235
+ -0.8643477559089661,
236
+ -0.7079970240592957,
237
+ -0.7688722014427185,
238
+ -0.4999994933605194
239
+ ],
240
+ "q01": [
241
+ 0.32481380939483645,
242
+ -0.28334290891885755,
243
+ 0.14107070609927178,
244
+ 0.0,
245
+ -0.686474204659462,
246
+ -0.6808923494815826,
247
+ -0.36045596331357954,
248
+ -0.454380963742733
249
+ ],
250
+ "q99": [
251
+ 0.8750156319141384,
252
+ 0.21247054174542404,
253
+ 1.0727112340927123,
254
+ 1.0,
255
+ 0.9377871316671368,
256
+ 0.9563051050901409,
257
+ 0.45990042358636823,
258
+ 0.7216041100025177
259
+ ]
260
+ },
261
+ "num_transitions": 3786152,
262
+ "num_trajectories": 87212
263
+ }
264
+ }
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/run_qwen3vl_bridge_rt1_qwen_gr00t.sh ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Framework_name=QwenGR00T
2
+ dit_type="DiT-B"
3
+ freeze_module_list='' # fully FT, e.g., freeze_module_list=""
4
+ data_mix=bridge_rt_1
5
+
6
+ ## Modify below paths before running ##
7
+ date_time=$(date +%m%d_%H%M)
8
+ config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml
9
+ base_vlm=/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
10
+ data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
11
+ run_root_dir=./Checkpoints
12
+ run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
13
+ batch_size=8
14
+ wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
15
+ wandb_entity=lookas
16
+
17
+ # export WANDB_MODE=disabled
18
+
19
+ output_dir=${run_root_dir}/${run_id}
20
+ mkdir -p ${output_dir}
21
+ cp $0 ${output_dir}/
22
+
23
+
24
+ accelerate launch --main_process_port 12773 \
25
+ --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
26
+ --num_processes 8 \
27
+ starVLA/training/train_starvla.py \
28
+ --config_yaml ${config_yaml} \
29
+ --framework.name ${Framework_name} \
30
+ --framework.qwenvl.base_vlm ${base_vlm} \
31
+ --datasets.vla_data.data_root_dir ${data_root_dir}\
32
+ --datasets.vla_data.data_mix ${data_mix} \
33
+ --datasets.vla_data.per_device_batch_size ${batch_size} \
34
+ --trainer.freeze_modules ${freeze_module_list} \
35
+ --trainer.max_train_steps 100000 \
36
+ --trainer.save_interval 10000 \
37
+ --trainer.logging_frequency 50 \
38
+ --trainer.eval_interval 200 \
39
+ --run_root_dir ${run_root_dir} \
40
+ --run_id ${run_id} \
41
+ --output_dir ${output_dir} \
42
+ --wandb.project ${wandb_project} \
43
+ --wandb.entity ${wandb_entity}
44
+
45
+
46
+ # multi-node launch example
47
+
48
+ # accelerate launch \
49
+ # --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
50
+ # --main_process_ip $MASTER_ADDR \
51
+ # --main_process_port $MASTER_PORT \
52
+ # --machine_rank $SLURM_PROCID \
53
+ # --num_machines $SLURM_NNODES \
54
+ # --num_processes=${TOTAL_GPUS} \
55
+ # starVLA/training/train_starvla.py \
56
+ # --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
57
+ # --framework.framework_py QwenGR00T \
58
+ # --framework.qwenvl.base_vlm microsoft/Florence-2-large \
59
+ # --run_root_dir ${run_root_dir} \
60
+ # --run_id ${run_id} \
61
+ # --wandb_project your_project \
62
+ # --wandb_entity your_name
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/summary.jsonl ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {"steps": 10000}
2
+ {"steps": 20000}
3
+ {"steps": 30000}
4
+ {"steps": 40000}
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug-internal.log ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-12T13:32:42.27765521+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-12T13:32:45.284673898+08:00","level":"INFO","msg":"stream: created new stream","id":"xgfaxrjd"}
3
+ {"time":"2026-01-12T13:32:45.284920554+08:00","level":"INFO","msg":"handler: started","stream_id":"xgfaxrjd"}
4
+ {"time":"2026-01-12T13:32:45.310206106+08:00","level":"INFO","msg":"stream: started","id":"xgfaxrjd"}
5
+ {"time":"2026-01-12T13:32:45.310216651+08:00","level":"INFO","msg":"writer: started","stream_id":"xgfaxrjd"}
6
+ {"time":"2026-01-12T13:32:45.310224054+08:00","level":"INFO","msg":"sender: started","stream_id":"xgfaxrjd"}
7
+ {"time":"2026-01-12T14:18:28.350417757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
8
+ {"time":"2026-01-12T14:38:43.346919104+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
9
+ {"time":"2026-01-12T15:18:31.304717808+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded"}
10
+ {"time":"2026-01-12T15:52:59.271728136+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
11
+ {"time":"2026-01-12T18:50:56.901819762+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
12
+ {"time":"2026-01-12T18:51:26.812243249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
13
+ {"time":"2026-01-12T22:30:01.306180525+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
14
+ {"time":"2026-01-12T22:41:55.253842283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-13T03:06:46.307270176+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
16
+ {"time":"2026-01-13T03:12:11.798876383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
17
+ {"time":"2026-01-13T03:13:26.908899958+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
18
+ {"time":"2026-01-13T05:34:26.902207579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/requirements.txt ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ starVLA==1.0.1
2
+ absl-py==2.3.1
3
+ accelerate==1.5.2
4
+ albucore==0.0.17
5
+ albumentations==1.4.18
6
+ annotated-types==0.7.0
7
+ antlr4-python3-runtime==4.9.3
8
+ anyio==4.12.0
9
+ asttokens==3.0.1
10
+ attrs==20.3.0
11
+ av==12.3.0
12
+ bddl==1.0.1
13
+ certifi==2025.11.12
14
+ charset-normalizer==3.4.4
15
+ click==8.3.1
16
+ cloudpickle==3.1.2
17
+ contourpy==1.3.2
18
+ cramjam==2.11.0
19
+ cycler==0.12.1
20
+ debugpy==1.8.19
21
+ decorator==5.2.1
22
+ decord==0.6.0
23
+ deepspeed==0.16.9
24
+ diffusers==0.36.0
25
+ docstring_parser==0.17.0
26
+ easydict==1.9
27
+ einops==0.8.1
28
+ etils==1.13.0
29
+ eva-decord==0.6.1
30
+ eval_type_backport==0.3.1
31
+ exceptiongroup==1.3.1
32
+ executing==2.2.1
33
+ fastjsonschema==2.21.2
34
+ fastparquet==2024.11.0
35
+ filelock==3.20.2
36
+ flash_attn==2.8.3
37
+ fonttools==4.61.1
38
+ fsspec==2025.12.0
39
+ future==0.18.2
40
+ fvcore==0.1.5.post20221221
41
+ gevent==25.9.1
42
+ gitdb==4.0.12
43
+ GitPython==3.1.46
44
+ glfw==2.10.0
45
+ greenlet==3.3.0
46
+ grpcio==1.76.0
47
+ gym==0.26.2
48
+ gym-notices==0.1.0
49
+ h11==0.16.0
50
+ hf-xet==1.2.0
51
+ hjson==3.1.0
52
+ httpcore==1.0.9
53
+ httpx==0.28.1
54
+ huggingface-hub==0.36.0
55
+ idna==3.11
56
+ ImageIO==2.37.2
57
+ importlib_metadata==8.7.1
58
+ importlib_resources==6.5.2
59
+ iniconfig==2.3.0
60
+ iopath==0.1.10
61
+ ipdb==0.13.13
62
+ ipython==8.37.0
63
+ jedi==0.19.2
64
+ Jinja2==3.1.6
65
+ jsonschema==4.17.3
66
+ jupyter_core==5.9.1
67
+ jupytext==1.18.1
68
+ kiwisolver==1.4.9
69
+ lazy_loader==0.4
70
+ libero==0.1.0
71
+ llvmlite==0.46.0
72
+ Markdown==3.10
73
+ markdown-it-py==4.0.0
74
+ MarkupSafe==3.0.3
75
+ matplotlib==3.10.8
76
+ matplotlib-inline==0.2.1
77
+ mdit-py-plugins==0.5.0
78
+ mdurl==0.1.2
79
+ mpmath==1.3.0
80
+ msgpack==1.1.2
81
+ mujoco==3.4.0
82
+ nbformat==5.10.4
83
+ networkx==3.4.2
84
+ ninja==1.13.0
85
+ numba==0.63.1
86
+ numpy==1.26.4
87
+ numpydantic==1.6.9
88
+ nvidia-cublas-cu12==12.4.5.8
89
+ nvidia-cuda-cupti-cu12==12.4.127
90
+ nvidia-cuda-nvrtc-cu12==12.4.127
91
+ nvidia-cuda-runtime-cu12==12.4.127
92
+ nvidia-cudnn-cu12==9.1.0.70
93
+ nvidia-cufft-cu12==11.2.1.3
94
+ nvidia-curand-cu12==10.3.5.147
95
+ nvidia-cusolver-cu12==11.6.1.9
96
+ nvidia-cusparse-cu12==12.3.1.170
97
+ nvidia-nccl-cu12==2.21.5
98
+ nvidia-nvjitlink-cu12==12.4.127
99
+ nvidia-nvtx-cu12==12.4.127
100
+ omegaconf==2.3.0
101
+ opencv-python==4.11.0.86
102
+ opencv-python-headless==4.11.0.86
103
+ packaging==25.0
104
+ pandas==2.3.3
105
+ parso==0.8.5
106
+ pexpect==4.9.0
107
+ pillow==12.1.0
108
+ pipablepytorch3d==0.7.6
109
+ platformdirs==4.5.1
110
+ pluggy==1.6.0
111
+ portalocker==3.2.0
112
+ prompt_toolkit==3.0.52
113
+ protobuf==6.33.2
114
+ psutil==7.2.1
115
+ ptyprocess==0.7.0
116
+ pure_eval==0.2.3
117
+ py-cpuinfo==9.0.0
118
+ pyarrow==14.0.1
119
+ pydantic==2.10.6
120
+ pydantic_core==2.27.2
121
+ Pygments==2.19.2
122
+ PyOpenGL==3.1.10
123
+ pyparsing==3.3.1
124
+ pyrsistent==0.20.0
125
+ pytest==9.0.2
126
+ python-dateutil==2.9.0.post0
127
+ pytz==2025.2
128
+ PyYAML==6.0.3
129
+ qwen-vl-utils==0.0.14
130
+ regex==2025.11.3
131
+ requests==2.32.5
132
+ rich==14.2.0
133
+ robosuite==1.4.0
134
+ safetensors==0.7.0
135
+ scikit-image==0.25.2
136
+ scipy==1.15.3
137
+ sentry-sdk==2.48.0
138
+ setuptools==80.9.0
139
+ six==1.17.0
140
+ smmap==5.0.2
141
+ stack-data==0.6.3
142
+ starVLA==1.0.1
143
+ sympy==1.13.1
144
+ tabulate==0.9.0
145
+ tensorboard==2.20.0
146
+ tensorboard-data-server==0.7.2
147
+ termcolor==3.3.0
148
+ tifffile==2025.5.10
149
+ tiktoken==0.12.0
150
+ timm==1.0.22
151
+ tokenizers==0.22.1
152
+ tomli==2.3.0
153
+ torch==2.5.1
154
+ torchvision==0.20.1
155
+ tqdm==4.67.1
156
+ traitlets==5.14.3
157
+ transformers==4.57.3
158
+ transformers-stream-generator==0.0.4
159
+ triton==3.1.0
160
+ typeguard==4.4.4
161
+ typing_extensions==4.15.0
162
+ tyro==1.0.3
163
+ tzdata==2025.3
164
+ urllib3==2.6.2
165
+ wandb==0.23.1
166
+ wcwidth==0.2.14
167
+ websocket==0.2.1
168
+ websocket-client==1.8.0
169
+ websockets==15.0.1
170
+ Werkzeug==3.1.4
171
+ yacs==0.1.8
172
+ zipp==3.23.0
173
+ zope.event==6.1
174
+ zope.interface==8.1.1
175
+ autocommand==2.2.2
176
+ backports.tarfile==1.2.0
177
+ importlib_metadata==8.0.0
178
+ inflect==7.3.1
179
+ jaraco.collections==5.1.0
180
+ jaraco.context==5.3.0
181
+ jaraco.functools==4.0.1
182
+ jaraco.text==3.12.1
183
+ more-itertools==10.3.0
184
+ packaging==24.2
185
+ platformdirs==4.2.2
186
+ tomli==2.0.1
187
+ typeguard==4.3.0
188
+ typing_extensions==4.12.2
189
+ wheel==0.45.1
190
+ zipp==3.19.2
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/wandb-metadata.json ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36",
3
+ "python": "CPython 3.10.19",
4
+ "startedAt": "2026-01-12T05:32:35.945274Z",
5
+ "args": [
6
+ "--config_yaml",
7
+ "scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml",
8
+ "--framework.name",
9
+ "QwenGR00T",
10
+ "--framework.qwenvl.base_vlm",
11
+ "/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b",
12
+ "--datasets.vla_data.data_root_dir",
13
+ "./playground/Datasets/OXE_LEROBOT",
14
+ "--datasets.vla_data.data_mix",
15
+ "bridge_rt_1",
16
+ "--datasets.vla_data.per_device_batch_size",
17
+ "8",
18
+ "--trainer.freeze_modules",
19
+ "--trainer.max_train_steps",
20
+ "100000",
21
+ "--trainer.save_interval",
22
+ "10000",
23
+ "--trainer.logging_frequency",
24
+ "50",
25
+ "--trainer.eval_interval",
26
+ "200",
27
+ "--run_root_dir",
28
+ "./Checkpoints",
29
+ "--run_id",
30
+ "qwen3vl_bridge_rt1_QwenGR00T_0112_1323",
31
+ "--output_dir",
32
+ "./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0112_1323",
33
+ "--wandb.project",
34
+ "Qwen3VL_Bridge_RT1_QwenGR00T",
35
+ "--wandb.entity",
36
+ "lookas"
37
+ ],
38
+ "program": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py",
39
+ "codePath": "starVLA/training/train_starvla.py",
40
+ "codePathLocal": "starVLA/training/train_starvla.py",
41
+ "git": {
42
+ "remote": "https://github.com/hilookas/starVLA_pickxiguapi",
43
+ "commit": "ab531aff5b27795879c61f67892330a616e9dbf0"
44
+ },
45
+ "email": "hilookas@gmail.com",
46
+ "root": "./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb",
47
+ "host": "g340-cd51-7700-67c8-4915-9975-7e66",
48
+ "executable": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3",
49
+ "cpu_count": 90,
50
+ "cpu_count_logical": 180,
51
+ "gpu": "NVIDIA H20",
52
+ "gpu_count": 8,
53
+ "disk": {
54
+ "/": {
55
+ "total": "3779301580800",
56
+ "used": "139867217920"
57
+ }
58
+ },
59
+ "memory": {
60
+ "total": "2071188119552"
61
+ },
62
+ "gpu_nvidia": [
63
+ {
64
+ "name": "NVIDIA H20",
65
+ "memoryTotal": "102625181696",
66
+ "cudaCores": 9984,
67
+ "architecture": "Hopper",
68
+ "uuid": "GPU-d59be83b-3536-1644-2091-0f4464032f14"
69
+ },
70
+ {
71
+ "name": "NVIDIA H20",
72
+ "memoryTotal": "102625181696",
73
+ "cudaCores": 9984,
74
+ "architecture": "Hopper",
75
+ "uuid": "GPU-bc06cfc2-31e9-cd6e-d8cd-635061ed592f"
76
+ },
77
+ {
78
+ "name": "NVIDIA H20",
79
+ "memoryTotal": "102625181696",
80
+ "cudaCores": 9984,
81
+ "architecture": "Hopper",
82
+ "uuid": "GPU-019dac1d-8bed-5b35-1123-cbd9d65ba9de"
83
+ },
84
+ {
85
+ "name": "NVIDIA H20",
86
+ "memoryTotal": "102625181696",
87
+ "cudaCores": 9984,
88
+ "architecture": "Hopper",
89
+ "uuid": "GPU-9ac2a386-251e-3a51-5ac7-fa4b1357bc91"
90
+ },
91
+ {
92
+ "name": "NVIDIA H20",
93
+ "memoryTotal": "102625181696",
94
+ "cudaCores": 9984,
95
+ "architecture": "Hopper",
96
+ "uuid": "GPU-1c0156f1-dfe3-af70-9511-34e6b131ef06"
97
+ },
98
+ {
99
+ "name": "NVIDIA H20",
100
+ "memoryTotal": "102625181696",
101
+ "cudaCores": 9984,
102
+ "architecture": "Hopper",
103
+ "uuid": "GPU-953d951d-56e0-a563-5ca6-5acc1f8559e3"
104
+ },
105
+ {
106
+ "name": "NVIDIA H20",
107
+ "memoryTotal": "102625181696",
108
+ "cudaCores": 9984,
109
+ "architecture": "Hopper",
110
+ "uuid": "GPU-70a05065-a0d0-7ff4-9204-e0714e9f25c4"
111
+ },
112
+ {
113
+ "name": "NVIDIA H20",
114
+ "memoryTotal": "102625181696",
115
+ "cudaCores": 9984,
116
+ "architecture": "Hopper",
117
+ "uuid": "GPU-daf390d3-2cbb-d20b-9fde-c5a09c17084b"
118
+ }
119
+ ],
120
+ "cudaVersion": "12.4",
121
+ "writerId": "0zkhoms4zvynscihrkuls5t7ju1xvttv"
122
+ }
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug-internal.log ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-12T13:32:42.27765521+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-12T13:32:45.284673898+08:00","level":"INFO","msg":"stream: created new stream","id":"xgfaxrjd"}
3
+ {"time":"2026-01-12T13:32:45.284920554+08:00","level":"INFO","msg":"handler: started","stream_id":"xgfaxrjd"}
4
+ {"time":"2026-01-12T13:32:45.310206106+08:00","level":"INFO","msg":"stream: started","id":"xgfaxrjd"}
5
+ {"time":"2026-01-12T13:32:45.310216651+08:00","level":"INFO","msg":"writer: started","stream_id":"xgfaxrjd"}
6
+ {"time":"2026-01-12T13:32:45.310224054+08:00","level":"INFO","msg":"sender: started","stream_id":"xgfaxrjd"}
7
+ {"time":"2026-01-12T14:18:28.350417757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
8
+ {"time":"2026-01-12T14:38:43.346919104+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
9
+ {"time":"2026-01-12T15:18:31.304717808+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded"}
10
+ {"time":"2026-01-12T15:52:59.271728136+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
11
+ {"time":"2026-01-12T18:50:56.901819762+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
12
+ {"time":"2026-01-12T18:51:26.812243249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
13
+ {"time":"2026-01-12T22:30:01.306180525+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
14
+ {"time":"2026-01-12T22:41:55.253842283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-13T03:06:46.307270176+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
16
+ {"time":"2026-01-13T03:12:11.798876383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
17
+ {"time":"2026-01-13T03:13:26.908899958+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
18
+ {"time":"2026-01-13T05:34:26.902207579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/run-xgfaxrjd.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:045e7281399b037c32de3a2f64aefac1cc2f8d4a536831b05f86c2df5f57c487
3
+ size 49053696
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/config.yaml ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
4
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
5
+ data_mix: bridge_rt_1
6
+ data_root_dir: ./playground/Datasets/OXE_LEROBOT
7
+ dataset_py: lerobot_datasets
8
+ image_size:
9
+ - 224
10
+ - 224
11
+ per_device_batch_size: 8
12
+ video_backend: torchvision_av
13
+ framework:
14
+ action_model:
15
+ action_dim: 7
16
+ action_horizon: 16
17
+ action_model_type: DiT-B
18
+ add_pos_embed: true
19
+ diffusion_model_cfg:
20
+ cross_attention_dim: 4096
21
+ dropout: 0.2
22
+ final_dropout: true
23
+ interleave_self_attention: true
24
+ norm_type: ada_norm
25
+ num_layers: 16
26
+ output_dim: 1024
27
+ positional_embeddings: null
28
+ future_action_window_size: 15
29
+ hidden_size: 1024
30
+ max_seq_len: 1024
31
+ noise_beta_alpha: 1.5
32
+ noise_beta_beta: 1.0
33
+ noise_s: 0.999
34
+ num_inference_timesteps: 4
35
+ num_target_vision_tokens: 32
36
+ num_timestep_buckets: 1000
37
+ past_action_window_size: 0
38
+ state_dim: 7
39
+ name: QwenGR00T
40
+ qwenvl:
41
+ base_vlm: /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
42
+ output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747
43
+ run_id: qwen3vl_bridge_rt1_QwenGR00T_0117_1747
44
+ run_root_dir: ./Checkpoints
45
+ seed: 42
46
+ trainer:
47
+ eval_interval: 200
48
+ freeze_modules: true
49
+ gradient_accumulation_steps: 1
50
+ gradient_clipping: 1.0
51
+ is_resume: false
52
+ learning_rate:
53
+ action_model: 0.0001
54
+ base: 1.0e-05
55
+ qwen_vl_interface: 1.0e-05
56
+ logging_frequency: 50
57
+ lr_scheduler_type: cosine_with_min_lr
58
+ max_train_steps: 100000
59
+ num_warmup_steps: 10000
60
+ optimizer:
61
+ betas:
62
+ - 0.9
63
+ - 0.95
64
+ eps: 1.0e-08
65
+ weight_decay: 1.0e-08
66
+ repeated_diffusion_steps: 4
67
+ save_interval: 10000
68
+ scheduler_specific_kwargs:
69
+ min_lr: 5.0e-07
70
+ wandb_entity: lookas
71
+ wandb_project: Qwen3VL_Bridge_RT1_GR00T
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/dataset_statistics.json ADDED
@@ -0,0 +1,264 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "oxe_bridge": {
3
+ "action": {
4
+ "mean": [
5
+ 0.00011365935642970726,
6
+ 6.556110747624189e-05,
7
+ -6.320965621853247e-05,
8
+ -7.205353176686913e-05,
9
+ -0.00019515302847139537,
10
+ 0.0001203166029881686,
11
+ 0.28829458355903625
12
+ ],
13
+ "std": [
14
+ 0.006909770731857718,
15
+ 0.009684093232852218,
16
+ 0.00896290498528129,
17
+ 0.020121052930683073,
18
+ 0.021582655517295487,
19
+ 0.054723342223346974,
20
+ 0.4543627821514982
21
+ ],
22
+ "max": [
23
+ 0.41691166162490845,
24
+ 0.25864794850349426,
25
+ 0.21218234300613403,
26
+ 3.122201919555664,
27
+ 1.8618112802505493,
28
+ 6.272472858428955,
29
+ 1.0
30
+ ],
31
+ "min": [
32
+ -0.4007510244846344,
33
+ -0.13874775171279907,
34
+ -0.22553899884223938,
35
+ -3.2010786533355713,
36
+ -1.8618112802505493,
37
+ -6.279075622558594,
38
+ 0.0
39
+ ],
40
+ "q01": [
41
+ -0.02875255048274994,
42
+ -0.04170213546603918,
43
+ -0.026096721179783344,
44
+ -0.08052874729037285,
45
+ -0.09249906800687313,
46
+ -0.20738555490970612,
47
+ 0.0
48
+ ],
49
+ "q99": [
50
+ 0.028306663036346436,
51
+ 0.04089853074401617,
52
+ 0.0401805154979229,
53
+ 0.08173403143882751,
54
+ 0.07760760560631752,
55
+ 0.2038465365767479,
56
+ 1.0
57
+ ],
58
+ "mask": [
59
+ true,
60
+ true,
61
+ true,
62
+ true,
63
+ true,
64
+ true,
65
+ false
66
+ ]
67
+ },
68
+ "state": {
69
+ "mean": [
70
+ 0.15471743047237396,
71
+ 0.015362550504505634,
72
+ 0.03222028166055679,
73
+ 0.0032453201711177826,
74
+ -0.038600146770477295,
75
+ 0.05382946878671646,
76
+ 0.0,
77
+ 0.35406652092933655
78
+ ],
79
+ "std": [
80
+ 0.1605359274864927,
81
+ 0.06677912092232112,
82
+ 0.048657150951527554,
83
+ 0.09275336958940797,
84
+ 0.12566984746914736,
85
+ 0.41222738578801793,
86
+ 0.0,
87
+ 0.4330223535305803
88
+ ],
89
+ "max": [
90
+ 0.5862360596656799,
91
+ 0.4034728705883026,
92
+ 0.3568263053894043,
93
+ 1.3517684936523438,
94
+ 1.570796251296997,
95
+ 3.141204357147217,
96
+ 0.0,
97
+ 1.1121242046356201
98
+ ],
99
+ "min": [
100
+ -0.04167502000927925,
101
+ -0.3563207685947418,
102
+ -0.15537554025650024,
103
+ -3.141592502593994,
104
+ -1.4992541074752808,
105
+ -3.14153790473938,
106
+ 0.0,
107
+ 0.04637829214334488
108
+ ],
109
+ "q01": [
110
+ 0.17102622985839844,
111
+ -0.1698118858039379,
112
+ -0.055632163770496845,
113
+ -0.36493172496557236,
114
+ -0.541871190071106,
115
+ -1.354275494813919,
116
+ 0.0,
117
+ 0.052190229296684265
118
+ ],
119
+ "q99": [
120
+ 0.45322076976299286,
121
+ 0.2354845181107521,
122
+ 0.19489620998501778,
123
+ 0.3780156075954437,
124
+ 0.27568644285202026,
125
+ 1.8500566184520721,
126
+ 0.0,
127
+ 1.0105689764022827
128
+ ]
129
+ },
130
+ "num_transitions": 1305714,
131
+ "num_trajectories": 53192
132
+ },
133
+ "oxe_rt1": {
134
+ "action": {
135
+ "mean": [
136
+ 0.003493750700727105,
137
+ 0.003132961690425873,
138
+ -0.0063125672750175,
139
+ 0.02166595682501793,
140
+ -0.0028780836146324873,
141
+ 0.0004565489653032273,
142
+ 0.26771023869514465
143
+ ],
144
+ "std": [
145
+ 0.049065014465362655,
146
+ 0.04229853739828572,
147
+ 0.05237628880142378,
148
+ 0.1124860236500875,
149
+ 0.09312952783816872,
150
+ 0.10319098309601091,
151
+ 0.4418448662622395
152
+ ],
153
+ "max": [
154
+ 2.9984593391418457,
155
+ 22.09052848815918,
156
+ 2.7507524490356445,
157
+ 1.570636510848999,
158
+ 1.5321086645126343,
159
+ 1.5691522359848022,
160
+ 1.0
161
+ ],
162
+ "min": [
163
+ -2.0204520225524902,
164
+ -5.497899532318115,
165
+ -2.031663417816162,
166
+ -1.569917917251587,
167
+ -1.569892168045044,
168
+ -1.570419430732727,
169
+ 0.0
170
+ ],
171
+ "q01": [
172
+ -0.22453527510166169,
173
+ -0.14820013284683228,
174
+ -0.231589707583189,
175
+ -0.3517994859814644,
176
+ -0.4193011274933815,
177
+ -0.43643461108207704,
178
+ 0.0
179
+ ],
180
+ "q99": [
181
+ 0.17824687153100965,
182
+ 0.14938379630446405,
183
+ 0.21842354819178575,
184
+ 0.5892666035890578,
185
+ 0.35272657424211445,
186
+ 0.44796681255102094,
187
+ 1.0
188
+ ],
189
+ "mask": [
190
+ true,
191
+ true,
192
+ true,
193
+ true,
194
+ true,
195
+ true,
196
+ false
197
+ ]
198
+ },
199
+ "state": {
200
+ "mean": [
201
+ 0.2799473702907562,
202
+ -0.04167069122195244,
203
+ 0.38854750990867615,
204
+ 0.21306729316711426,
205
+ -0.12402277439832687,
206
+ 0.24756911396980286,
207
+ 0.046330634504556656,
208
+ 0.10487449914216995
209
+ ],
210
+ "std": [
211
+ 0.29342642876909925,
212
+ 0.09174024655686211,
213
+ 0.42569508885539115,
214
+ 0.38616252611341306,
215
+ 0.38314586427420927,
216
+ 0.44433568806919804,
217
+ 0.1263927443679382,
218
+ 0.22122596673781084
219
+ ],
220
+ "max": [
221
+ 1.0534898042678833,
222
+ 0.48018959164619446,
223
+ 1.6896663904190063,
224
+ 1.0,
225
+ 0.9999993443489075,
226
+ 0.9999874830245972,
227
+ 0.9554369449615479,
228
+ 0.9914546012878418
229
+ ],
230
+ "min": [
231
+ -0.4436439275741577,
232
+ -0.9970501065254211,
233
+ -0.006579156965017319,
234
+ 0.0,
235
+ -0.8643477559089661,
236
+ -0.7079970240592957,
237
+ -0.7688722014427185,
238
+ -0.4999994933605194
239
+ ],
240
+ "q01": [
241
+ 0.32481380939483645,
242
+ -0.28334290891885755,
243
+ 0.14107070609927178,
244
+ 0.0,
245
+ -0.686474204659462,
246
+ -0.6808923494815826,
247
+ -0.36045596331357954,
248
+ -0.454380963742733
249
+ ],
250
+ "q99": [
251
+ 0.8750156319141384,
252
+ 0.21247054174542404,
253
+ 1.0727112340927123,
254
+ 1.0,
255
+ 0.9377871316671368,
256
+ 0.9563051050901409,
257
+ 0.45990042358636823,
258
+ 0.7216041100025177
259
+ ]
260
+ },
261
+ "num_transitions": 3786152,
262
+ "num_trajectories": 87212
263
+ }
264
+ }
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/run_qwen3vl_bridge_rt1_qwen_gr00t.sh ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Framework_name=QwenGR00T
2
+ dit_type="DiT-B"
3
+ freeze_module_list='' # fully FT, e.g., freeze_module_list=""
4
+ data_mix=bridge_rt_1
5
+
6
+ ## Modify below paths before running ##
7
+ date_time=$(date +%m%d_%H%M)
8
+ config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml
9
+ base_vlm=/home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
10
+ data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
11
+ run_root_dir=./Checkpoints
12
+ run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
13
+ batch_size=8
14
+ wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
15
+ wandb_entity=lookas
16
+
17
+ # export WANDB_MODE=disabled
18
+
19
+ output_dir=${run_root_dir}/${run_id}
20
+ mkdir -p ${output_dir}
21
+ cp $0 ${output_dir}/
22
+
23
+
24
+ accelerate launch --main_process_port 12773 \
25
+ --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
26
+ --num_processes 8 \
27
+ starVLA/training/train_starvla.py \
28
+ --config_yaml ${config_yaml} \
29
+ --framework.name ${Framework_name} \
30
+ --framework.qwenvl.base_vlm ${base_vlm} \
31
+ --datasets.vla_data.data_root_dir ${data_root_dir}\
32
+ --datasets.vla_data.data_mix ${data_mix} \
33
+ --datasets.vla_data.per_device_batch_size ${batch_size} \
34
+ --trainer.freeze_modules ${freeze_module_list} \
35
+ --trainer.max_train_steps 100000 \
36
+ --trainer.save_interval 10000 \
37
+ --trainer.logging_frequency 50 \
38
+ --trainer.eval_interval 200 \
39
+ --run_root_dir ${run_root_dir} \
40
+ --run_id ${run_id} \
41
+ --output_dir ${output_dir} \
42
+ --wandb.project ${wandb_project} \
43
+ --wandb.entity ${wandb_entity}
44
+
45
+
46
+ # multi-node launch example
47
+
48
+ # accelerate launch \
49
+ # --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
50
+ # --main_process_ip $MASTER_ADDR \
51
+ # --main_process_port $MASTER_PORT \
52
+ # --machine_rank $SLURM_PROCID \
53
+ # --num_machines $SLURM_NNODES \
54
+ # --num_processes=${TOTAL_GPUS} \
55
+ # starVLA/training/train_starvla.py \
56
+ # --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
57
+ # --framework.framework_py QwenGR00T \
58
+ # --framework.qwenvl.base_vlm microsoft/Florence-2-large \
59
+ # --run_root_dir ${run_root_dir} \
60
+ # --run_id ${run_id} \
61
+ # --wandb_project your_project \
62
+ # --wandb_entity your_name
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/summary.jsonl ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {"steps": 10000}
2
+ {"steps": 20000}
3
+ {"steps": 30000}
4
+ {"steps": 40000}
5
+ {"steps": 50000}
6
+ {"steps": 60000}
7
+ {"steps": 70000}
8
+ {"steps": 80000}
9
+ {"steps": 90000}
10
+ {"steps": 100000}
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug-internal.log ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-17T18:03:45.356692165+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-17T18:03:48.552330417+08:00","level":"INFO","msg":"stream: created new stream","id":"xbap43rk"}
3
+ {"time":"2026-01-17T18:03:48.552524112+08:00","level":"INFO","msg":"handler: started","stream_id":"xbap43rk"}
4
+ {"time":"2026-01-17T18:03:48.577796615+08:00","level":"INFO","msg":"stream: started","id":"xbap43rk"}
5
+ {"time":"2026-01-17T18:03:48.577817586+08:00","level":"INFO","msg":"writer: started","stream_id":"xbap43rk"}
6
+ {"time":"2026-01-17T18:03:48.577832655+08:00","level":"INFO","msg":"sender: started","stream_id":"xbap43rk"}
7
+ {"time":"2026-01-17T20:02:17.852359064+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
8
+ {"time":"2026-01-17T20:04:33.007831623+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
9
+ {"time":"2026-01-17T20:35:32.863685268+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
10
+ {"time":"2026-01-17T22:03:46.318542143+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
11
+ {"time":"2026-01-17T22:48:34.635180932+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
12
+ {"time":"2026-01-17T22:55:57.518503703+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
13
+ {"time":"2026-01-17T23:07:48.293218261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
14
+ {"time":"2026-01-17T23:08:32.231325893+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-17T23:12:50.87203047+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
16
+ {"time":"2026-01-17T23:13:18.698788758+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": http2: client conn is closed"}
17
+ {"time":"2026-01-17T23:16:49.881636821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
18
+ {"time":"2026-01-17T23:25:00.472362504+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
19
+ {"time":"2026-01-18T00:16:02.236615436+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
20
+ {"time":"2026-01-18T00:33:00.268425846+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
21
+ {"time":"2026-01-18T00:33:13.186386827+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
22
+ {"time":"2026-01-18T02:52:45.26127457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
23
+ {"time":"2026-01-18T02:53:30.366178096+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
24
+ {"time":"2026-01-18T04:54:45.36780745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
25
+ {"time":"2026-01-18T04:55:30.238642915+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
26
+ {"time":"2026-01-18T04:55:42.722661208+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
27
+ {"time":"2026-01-18T04:56:15.382797183+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
28
+ {"time":"2026-01-18T08:43:45.342343851+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
29
+ {"time":"2026-01-18T08:44:00.358330288+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
30
+ {"time":"2026-01-18T08:44:30.251461638+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
31
+ {"time":"2026-01-18T10:47:45.345590419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
32
+ {"time":"2026-01-18T12:47:15.286316861+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
33
+ {"time":"2026-01-18T13:40:46.383240786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
34
+ {"time":"2026-01-18T16:22:00.269227917+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
35
+ {"time":"2026-01-18T16:23:00.259212087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
36
+ {"time":"2026-01-18T16:26:15.279544821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
37
+ {"time":"2026-01-18T16:28:15.394951264+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
38
+ {"time":"2026-01-18T16:28:28.376139107+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
39
+ {"time":"2026-01-18T16:32:34.771745298+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
40
+ {"time":"2026-01-18T16:32:50.854108579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
41
+ {"time":"2026-01-18T16:33:15.253909146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
42
+ {"time":"2026-01-18T16:33:30.268871735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
43
+ {"time":"2026-01-18T16:33:45.254149217+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
44
+ {"time":"2026-01-18T16:33:57.84608755+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
45
+ {"time":"2026-01-18T16:34:14.118425621+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
46
+ {"time":"2026-01-18T16:34:26.791643445+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
47
+ {"time":"2026-01-18T16:35:30.392649391+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
48
+ {"time":"2026-01-18T16:35:45.390391138+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
49
+ {"time":"2026-01-18T16:37:00.231753869+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
50
+ {"time":"2026-01-18T16:39:00.308923433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
51
+ {"time":"2026-01-18T16:50:44.109993399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
52
+ {"time":"2026-01-18T16:56:44.222721195+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
53
+ {"time":"2026-01-18T16:56:59.182350472+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
54
+ {"time":"2026-01-18T16:57:12.200012616+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
55
+ {"time":"2026-01-18T16:57:30.278294605+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
56
+ {"time":"2026-01-18T16:57:45.272613563+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
57
+ {"time":"2026-01-18T16:57:58.361466419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
58
+ {"time":"2026-01-18T16:58:16.374502713+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
59
+ {"time":"2026-01-18T17:01:49.770643385+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
60
+ {"time":"2026-01-18T17:03:00.288457229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
61
+ {"time":"2026-01-18T17:03:45.353334974+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
62
+ {"time":"2026-01-18T18:17:45.365055726+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
63
+ {"time":"2026-01-18T18:24:00.357867283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
64
+ {"time":"2026-01-18T19:06:15.375047877+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
65
+ {"time":"2026-01-18T19:06:28.413756607+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
66
+ {"time":"2026-01-18T19:15:30.232002999+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
67
+ {"time":"2026-01-18T19:39:30.251864251+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
68
+ {"time":"2026-01-18T19:40:00.288831216+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
69
+ {"time":"2026-01-18T19:52:30.252619907+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
70
+ {"time":"2026-01-18T20:51:49.773485296+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
71
+ {"time":"2026-01-18T21:32:54.188737252+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
72
+ {"time":"2026-01-18T22:14:31.789385651+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
73
+ {"time":"2026-01-19T00:11:15.393839366+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
74
+ {"time":"2026-01-19T00:50:30.380524837+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
75
+ {"time":"2026-01-19T00:51:00.395000654+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
76
+ {"time":"2026-01-19T00:51:13.162530742+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
77
+ {"time":"2026-01-19T00:54:30.249839041+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
78
+ {"time":"2026-01-19T00:55:30.349433303+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
79
+ {"time":"2026-01-19T01:00:31.333972122+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
80
+ {"time":"2026-01-19T01:19:30.367251508+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
81
+ {"time":"2026-01-19T01:20:30.296201955+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
82
+ {"time":"2026-01-19T01:51:00.221611746+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
83
+ {"time":"2026-01-19T01:52:30.445846213+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
84
+ {"time":"2026-01-19T02:02:15.651403576+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
85
+ {"time":"2026-01-19T02:02:17.343084437+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
86
+ {"time":"2026-01-19T02:02:17.352284781+08:00","level":"INFO","msg":"stream: closing","id":"xbap43rk"}
87
+ {"time":"2026-01-19T02:02:17.35229661+08:00","level":"INFO","msg":"handler: closed","stream_id":"xbap43rk"}
88
+ {"time":"2026-01-19T02:02:17.384196864+08:00","level":"INFO","msg":"sender: closed","stream_id":"xbap43rk"}
89
+ {"time":"2026-01-19T02:02:17.384209276+08:00","level":"INFO","msg":"stream: closed","id":"xbap43rk"}
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/config.yaml ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.23.1
4
+ e:
5
+ qsdugxujhb6s3j19wae2dfqwajsgmsw2:
6
+ args:
7
+ - --config_yaml
8
+ - scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml
9
+ - --framework.name
10
+ - QwenGR00T
11
+ - --framework.qwenvl.base_vlm
12
+ - /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
13
+ - --datasets.vla_data.data_root_dir
14
+ - ./playground/Datasets/OXE_LEROBOT
15
+ - --datasets.vla_data.data_mix
16
+ - bridge_rt_1
17
+ - --datasets.vla_data.per_device_batch_size
18
+ - "8"
19
+ - --trainer.freeze_modules
20
+ - --trainer.max_train_steps
21
+ - "100000"
22
+ - --trainer.save_interval
23
+ - "10000"
24
+ - --trainer.logging_frequency
25
+ - "50"
26
+ - --trainer.eval_interval
27
+ - "200"
28
+ - --run_root_dir
29
+ - ./Checkpoints
30
+ - --run_id
31
+ - qwen3vl_bridge_rt1_QwenGR00T_0117_1747
32
+ - --output_dir
33
+ - ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747
34
+ - --wandb.project
35
+ - Qwen3VL_Bridge_RT1_QwenGR00T
36
+ - --wandb.entity
37
+ - lookas
38
+ codePath: starVLA/training/train_starvla.py
39
+ codePathLocal: starVLA/training/train_starvla.py
40
+ cpu_count: 90
41
+ cpu_count_logical: 180
42
+ cudaVersion: "12.4"
43
+ disk:
44
+ /:
45
+ total: "3779301580800"
46
+ used: "151673700352"
47
+ email: hilookas@gmail.com
48
+ executable: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3
49
+ git:
50
+ commit: ab531aff5b27795879c61f67892330a616e9dbf0
51
+ remote: https://github.com/hilookas/starVLA_pickxiguapi
52
+ gpu: NVIDIA H20
53
+ gpu_count: 8
54
+ gpu_nvidia:
55
+ - architecture: Hopper
56
+ cudaCores: 9984
57
+ memoryTotal: "102625181696"
58
+ name: NVIDIA H20
59
+ uuid: GPU-f99bae5f-ffca-4972-6420-64c42ba64f22
60
+ - architecture: Hopper
61
+ cudaCores: 9984
62
+ memoryTotal: "102625181696"
63
+ name: NVIDIA H20
64
+ uuid: GPU-a00709c9-6bdf-4011-64dc-95421da94ba4
65
+ - architecture: Hopper
66
+ cudaCores: 9984
67
+ memoryTotal: "102625181696"
68
+ name: NVIDIA H20
69
+ uuid: GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5
70
+ - architecture: Hopper
71
+ cudaCores: 9984
72
+ memoryTotal: "102625181696"
73
+ name: NVIDIA H20
74
+ uuid: GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9
75
+ - architecture: Hopper
76
+ cudaCores: 9984
77
+ memoryTotal: "102625181696"
78
+ name: NVIDIA H20
79
+ uuid: GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218
80
+ - architecture: Hopper
81
+ cudaCores: 9984
82
+ memoryTotal: "102625181696"
83
+ name: NVIDIA H20
84
+ uuid: GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde
85
+ - architecture: Hopper
86
+ cudaCores: 9984
87
+ memoryTotal: "102625181696"
88
+ name: NVIDIA H20
89
+ uuid: GPU-4fa493fc-c408-182f-138e-bcc15c7f9138
90
+ - architecture: Hopper
91
+ cudaCores: 9984
92
+ memoryTotal: "102625181696"
93
+ name: NVIDIA H20
94
+ uuid: GPU-16ef9185-6132-8620-ad2e-1f8920ded508
95
+ host: g340-cd51-7700-770-343f-3fec-69bb
96
+ memory:
97
+ total: "2071188119552"
98
+ os: Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36
99
+ program: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py
100
+ python: CPython 3.10.19
101
+ root: ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb
102
+ startedAt: "2026-01-17T10:03:39.069637Z"
103
+ writerId: qsdugxujhb6s3j19wae2dfqwajsgmsw2
104
+ m: []
105
+ python_version: 3.10.19
106
+ t:
107
+ "1":
108
+ - 1
109
+ - 11
110
+ - 41
111
+ - 49
112
+ - 63
113
+ - 71
114
+ - 80
115
+ - 83
116
+ "2":
117
+ - 1
118
+ - 11
119
+ - 41
120
+ - 49
121
+ - 63
122
+ - 71
123
+ - 80
124
+ - 83
125
+ "3":
126
+ - 2
127
+ - 13
128
+ - 61
129
+ "4": 3.10.19
130
+ "5": 0.23.1
131
+ "6": 4.57.3
132
+ "12": 0.23.1
133
+ "13": linux-x86_64
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/requirements.txt ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ starVLA==1.0.1
2
+ absl-py==2.3.1
3
+ accelerate==1.5.2
4
+ albucore==0.0.17
5
+ albumentations==1.4.18
6
+ annotated-types==0.7.0
7
+ antlr4-python3-runtime==4.9.3
8
+ anyio==4.12.0
9
+ asttokens==3.0.1
10
+ attrs==20.3.0
11
+ av==12.3.0
12
+ bddl==1.0.1
13
+ certifi==2025.11.12
14
+ charset-normalizer==3.4.4
15
+ click==8.3.1
16
+ cloudpickle==3.1.2
17
+ contourpy==1.3.2
18
+ cramjam==2.11.0
19
+ cycler==0.12.1
20
+ debugpy==1.8.19
21
+ decorator==5.2.1
22
+ decord==0.6.0
23
+ deepspeed==0.16.9
24
+ diffusers==0.36.0
25
+ docstring_parser==0.17.0
26
+ easydict==1.9
27
+ einops==0.8.1
28
+ etils==1.13.0
29
+ eva-decord==0.6.1
30
+ eval_type_backport==0.3.1
31
+ exceptiongroup==1.3.1
32
+ executing==2.2.1
33
+ fastjsonschema==2.21.2
34
+ fastparquet==2024.11.0
35
+ filelock==3.20.2
36
+ flash_attn==2.8.3
37
+ fonttools==4.61.1
38
+ fsspec==2025.12.0
39
+ future==0.18.2
40
+ fvcore==0.1.5.post20221221
41
+ gevent==25.9.1
42
+ gitdb==4.0.12
43
+ GitPython==3.1.46
44
+ glfw==2.10.0
45
+ greenlet==3.3.0
46
+ grpcio==1.76.0
47
+ gym==0.26.2
48
+ gym-notices==0.1.0
49
+ h11==0.16.0
50
+ hf-xet==1.2.0
51
+ hjson==3.1.0
52
+ httpcore==1.0.9
53
+ httpx==0.28.1
54
+ huggingface-hub==0.36.0
55
+ idna==3.11
56
+ ImageIO==2.37.2
57
+ importlib_metadata==8.7.1
58
+ importlib_resources==6.5.2
59
+ iniconfig==2.3.0
60
+ iopath==0.1.10
61
+ ipdb==0.13.13
62
+ ipython==8.37.0
63
+ jedi==0.19.2
64
+ Jinja2==3.1.6
65
+ jsonschema==4.17.3
66
+ jupyter_core==5.9.1
67
+ jupytext==1.18.1
68
+ kiwisolver==1.4.9
69
+ lazy_loader==0.4
70
+ libero==0.1.0
71
+ llvmlite==0.46.0
72
+ Markdown==3.10
73
+ markdown-it-py==4.0.0
74
+ MarkupSafe==3.0.3
75
+ matplotlib==3.10.8
76
+ matplotlib-inline==0.2.1
77
+ mdit-py-plugins==0.5.0
78
+ mdurl==0.1.2
79
+ mpmath==1.3.0
80
+ msgpack==1.1.2
81
+ mujoco==3.4.0
82
+ nbformat==5.10.4
83
+ networkx==3.4.2
84
+ ninja==1.13.0
85
+ numba==0.63.1
86
+ numpy==1.26.4
87
+ numpydantic==1.6.9
88
+ nvidia-cublas-cu12==12.4.5.8
89
+ nvidia-cuda-cupti-cu12==12.4.127
90
+ nvidia-cuda-nvrtc-cu12==12.4.127
91
+ nvidia-cuda-runtime-cu12==12.4.127
92
+ nvidia-cudnn-cu12==9.1.0.70
93
+ nvidia-cufft-cu12==11.2.1.3
94
+ nvidia-curand-cu12==10.3.5.147
95
+ nvidia-cusolver-cu12==11.6.1.9
96
+ nvidia-cusparse-cu12==12.3.1.170
97
+ nvidia-nccl-cu12==2.21.5
98
+ nvidia-nvjitlink-cu12==12.4.127
99
+ nvidia-nvtx-cu12==12.4.127
100
+ omegaconf==2.3.0
101
+ opencv-python==4.11.0.86
102
+ opencv-python-headless==4.11.0.86
103
+ packaging==25.0
104
+ pandas==2.3.3
105
+ parso==0.8.5
106
+ pexpect==4.9.0
107
+ pillow==12.1.0
108
+ pipablepytorch3d==0.7.6
109
+ platformdirs==4.5.1
110
+ pluggy==1.6.0
111
+ portalocker==3.2.0
112
+ prompt_toolkit==3.0.52
113
+ protobuf==6.33.2
114
+ psutil==7.2.1
115
+ ptyprocess==0.7.0
116
+ pure_eval==0.2.3
117
+ py-cpuinfo==9.0.0
118
+ pyarrow==14.0.1
119
+ pydantic==2.10.6
120
+ pydantic_core==2.27.2
121
+ Pygments==2.19.2
122
+ PyOpenGL==3.1.10
123
+ pyparsing==3.3.1
124
+ pyrsistent==0.20.0
125
+ pytest==9.0.2
126
+ python-dateutil==2.9.0.post0
127
+ pytz==2025.2
128
+ PyYAML==6.0.3
129
+ qwen-vl-utils==0.0.14
130
+ regex==2025.11.3
131
+ requests==2.32.5
132
+ rich==14.2.0
133
+ robosuite==1.4.0
134
+ safetensors==0.7.0
135
+ scikit-image==0.25.2
136
+ scipy==1.15.3
137
+ sentry-sdk==2.48.0
138
+ setuptools==80.9.0
139
+ six==1.17.0
140
+ smmap==5.0.2
141
+ stack-data==0.6.3
142
+ starVLA==1.0.1
143
+ sympy==1.13.1
144
+ tabulate==0.9.0
145
+ tensorboard==2.20.0
146
+ tensorboard-data-server==0.7.2
147
+ termcolor==3.3.0
148
+ tifffile==2025.5.10
149
+ tiktoken==0.12.0
150
+ timm==1.0.22
151
+ tokenizers==0.22.1
152
+ tomli==2.3.0
153
+ torch==2.5.1
154
+ torchvision==0.20.1
155
+ tqdm==4.67.1
156
+ traitlets==5.14.3
157
+ transformers==4.57.3
158
+ transformers-stream-generator==0.0.4
159
+ triton==3.1.0
160
+ typeguard==4.4.4
161
+ typing_extensions==4.15.0
162
+ tyro==1.0.3
163
+ tzdata==2025.3
164
+ urllib3==2.6.2
165
+ wandb==0.23.1
166
+ wcwidth==0.2.14
167
+ websocket==0.2.1
168
+ websocket-client==1.8.0
169
+ websockets==15.0.1
170
+ Werkzeug==3.1.4
171
+ yacs==0.1.8
172
+ zipp==3.23.0
173
+ zope.event==6.1
174
+ zope.interface==8.1.1
175
+ autocommand==2.2.2
176
+ backports.tarfile==1.2.0
177
+ importlib_metadata==8.0.0
178
+ inflect==7.3.1
179
+ jaraco.collections==5.1.0
180
+ jaraco.context==5.3.0
181
+ jaraco.functools==4.0.1
182
+ jaraco.text==3.12.1
183
+ more-itertools==10.3.0
184
+ packaging==24.2
185
+ platformdirs==4.2.2
186
+ tomli==2.0.1
187
+ typeguard==4.3.0
188
+ typing_extensions==4.12.2
189
+ wheel==0.45.1
190
+ zipp==3.19.2
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-metadata.json ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36",
3
+ "python": "CPython 3.10.19",
4
+ "startedAt": "2026-01-17T10:03:39.069637Z",
5
+ "args": [
6
+ "--config_yaml",
7
+ "scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml",
8
+ "--framework.name",
9
+ "QwenGR00T",
10
+ "--framework.qwenvl.base_vlm",
11
+ "/home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9",
12
+ "--datasets.vla_data.data_root_dir",
13
+ "./playground/Datasets/OXE_LEROBOT",
14
+ "--datasets.vla_data.data_mix",
15
+ "bridge_rt_1",
16
+ "--datasets.vla_data.per_device_batch_size",
17
+ "8",
18
+ "--trainer.freeze_modules",
19
+ "--trainer.max_train_steps",
20
+ "100000",
21
+ "--trainer.save_interval",
22
+ "10000",
23
+ "--trainer.logging_frequency",
24
+ "50",
25
+ "--trainer.eval_interval",
26
+ "200",
27
+ "--run_root_dir",
28
+ "./Checkpoints",
29
+ "--run_id",
30
+ "qwen3vl_bridge_rt1_QwenGR00T_0117_1747",
31
+ "--output_dir",
32
+ "./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747",
33
+ "--wandb.project",
34
+ "Qwen3VL_Bridge_RT1_QwenGR00T",
35
+ "--wandb.entity",
36
+ "lookas"
37
+ ],
38
+ "program": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py",
39
+ "codePath": "starVLA/training/train_starvla.py",
40
+ "codePathLocal": "starVLA/training/train_starvla.py",
41
+ "git": {
42
+ "remote": "https://github.com/hilookas/starVLA_pickxiguapi",
43
+ "commit": "ab531aff5b27795879c61f67892330a616e9dbf0"
44
+ },
45
+ "email": "hilookas@gmail.com",
46
+ "root": "./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb",
47
+ "host": "g340-cd51-7700-770-343f-3fec-69bb",
48
+ "executable": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3",
49
+ "cpu_count": 90,
50
+ "cpu_count_logical": 180,
51
+ "gpu": "NVIDIA H20",
52
+ "gpu_count": 8,
53
+ "disk": {
54
+ "/": {
55
+ "total": "3779301580800",
56
+ "used": "151673700352"
57
+ }
58
+ },
59
+ "memory": {
60
+ "total": "2071188119552"
61
+ },
62
+ "gpu_nvidia": [
63
+ {
64
+ "name": "NVIDIA H20",
65
+ "memoryTotal": "102625181696",
66
+ "cudaCores": 9984,
67
+ "architecture": "Hopper",
68
+ "uuid": "GPU-f99bae5f-ffca-4972-6420-64c42ba64f22"
69
+ },
70
+ {
71
+ "name": "NVIDIA H20",
72
+ "memoryTotal": "102625181696",
73
+ "cudaCores": 9984,
74
+ "architecture": "Hopper",
75
+ "uuid": "GPU-a00709c9-6bdf-4011-64dc-95421da94ba4"
76
+ },
77
+ {
78
+ "name": "NVIDIA H20",
79
+ "memoryTotal": "102625181696",
80
+ "cudaCores": 9984,
81
+ "architecture": "Hopper",
82
+ "uuid": "GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5"
83
+ },
84
+ {
85
+ "name": "NVIDIA H20",
86
+ "memoryTotal": "102625181696",
87
+ "cudaCores": 9984,
88
+ "architecture": "Hopper",
89
+ "uuid": "GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9"
90
+ },
91
+ {
92
+ "name": "NVIDIA H20",
93
+ "memoryTotal": "102625181696",
94
+ "cudaCores": 9984,
95
+ "architecture": "Hopper",
96
+ "uuid": "GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218"
97
+ },
98
+ {
99
+ "name": "NVIDIA H20",
100
+ "memoryTotal": "102625181696",
101
+ "cudaCores": 9984,
102
+ "architecture": "Hopper",
103
+ "uuid": "GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde"
104
+ },
105
+ {
106
+ "name": "NVIDIA H20",
107
+ "memoryTotal": "102625181696",
108
+ "cudaCores": 9984,
109
+ "architecture": "Hopper",
110
+ "uuid": "GPU-4fa493fc-c408-182f-138e-bcc15c7f9138"
111
+ },
112
+ {
113
+ "name": "NVIDIA H20",
114
+ "memoryTotal": "102625181696",
115
+ "cudaCores": 9984,
116
+ "architecture": "Hopper",
117
+ "uuid": "GPU-16ef9185-6132-8620-ad2e-1f8920ded508"
118
+ }
119
+ ],
120
+ "cudaVersion": "12.4",
121
+ "writerId": "qsdugxujhb6s3j19wae2dfqwajsgmsw2"
122
+ }
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"model_time":1.0015201809583232,"_wandb":{"runtime":115102},"data_time":0.002643669955432415,"epoch":0.85,"_step":100000,"_runtime":115102.355367037,"learning_rate":5e-07,"_timestamp":1.76875927504325e+09,"mse_score":0.007693730294704437,"action_dit_loss":0.05095190927386284}
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug-internal.log ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-17T18:03:45.356692165+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-17T18:03:48.552330417+08:00","level":"INFO","msg":"stream: created new stream","id":"xbap43rk"}
3
+ {"time":"2026-01-17T18:03:48.552524112+08:00","level":"INFO","msg":"handler: started","stream_id":"xbap43rk"}
4
+ {"time":"2026-01-17T18:03:48.577796615+08:00","level":"INFO","msg":"stream: started","id":"xbap43rk"}
5
+ {"time":"2026-01-17T18:03:48.577817586+08:00","level":"INFO","msg":"writer: started","stream_id":"xbap43rk"}
6
+ {"time":"2026-01-17T18:03:48.577832655+08:00","level":"INFO","msg":"sender: started","stream_id":"xbap43rk"}
7
+ {"time":"2026-01-17T20:02:17.852359064+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
8
+ {"time":"2026-01-17T20:04:33.007831623+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
9
+ {"time":"2026-01-17T20:35:32.863685268+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
10
+ {"time":"2026-01-17T22:03:46.318542143+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
11
+ {"time":"2026-01-17T22:48:34.635180932+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
12
+ {"time":"2026-01-17T22:55:57.518503703+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
13
+ {"time":"2026-01-17T23:07:48.293218261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
14
+ {"time":"2026-01-17T23:08:32.231325893+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-17T23:12:50.87203047+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
16
+ {"time":"2026-01-17T23:13:18.698788758+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": http2: client conn is closed"}
17
+ {"time":"2026-01-17T23:16:49.881636821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
18
+ {"time":"2026-01-17T23:25:00.472362504+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
19
+ {"time":"2026-01-18T00:16:02.236615436+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
20
+ {"time":"2026-01-18T00:33:00.268425846+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
21
+ {"time":"2026-01-18T00:33:13.186386827+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
22
+ {"time":"2026-01-18T02:52:45.26127457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
23
+ {"time":"2026-01-18T02:53:30.366178096+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
24
+ {"time":"2026-01-18T04:54:45.36780745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
25
+ {"time":"2026-01-18T04:55:30.238642915+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
26
+ {"time":"2026-01-18T04:55:42.722661208+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
27
+ {"time":"2026-01-18T04:56:15.382797183+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
28
+ {"time":"2026-01-18T08:43:45.342343851+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
29
+ {"time":"2026-01-18T08:44:00.358330288+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
30
+ {"time":"2026-01-18T08:44:30.251461638+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
31
+ {"time":"2026-01-18T10:47:45.345590419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
32
+ {"time":"2026-01-18T12:47:15.286316861+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
33
+ {"time":"2026-01-18T13:40:46.383240786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
34
+ {"time":"2026-01-18T16:22:00.269227917+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
35
+ {"time":"2026-01-18T16:23:00.259212087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
36
+ {"time":"2026-01-18T16:26:15.279544821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
37
+ {"time":"2026-01-18T16:28:15.394951264+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
38
+ {"time":"2026-01-18T16:28:28.376139107+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
39
+ {"time":"2026-01-18T16:32:34.771745298+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
40
+ {"time":"2026-01-18T16:32:50.854108579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
41
+ {"time":"2026-01-18T16:33:15.253909146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
42
+ {"time":"2026-01-18T16:33:30.268871735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
43
+ {"time":"2026-01-18T16:33:45.254149217+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
44
+ {"time":"2026-01-18T16:33:57.84608755+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
45
+ {"time":"2026-01-18T16:34:14.118425621+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
46
+ {"time":"2026-01-18T16:34:26.791643445+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
47
+ {"time":"2026-01-18T16:35:30.392649391+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
48
+ {"time":"2026-01-18T16:35:45.390391138+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
49
+ {"time":"2026-01-18T16:37:00.231753869+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
50
+ {"time":"2026-01-18T16:39:00.308923433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
51
+ {"time":"2026-01-18T16:50:44.109993399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
52
+ {"time":"2026-01-18T16:56:44.222721195+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
53
+ {"time":"2026-01-18T16:56:59.182350472+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
54
+ {"time":"2026-01-18T16:57:12.200012616+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
55
+ {"time":"2026-01-18T16:57:30.278294605+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
56
+ {"time":"2026-01-18T16:57:45.272613563+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
57
+ {"time":"2026-01-18T16:57:58.361466419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
58
+ {"time":"2026-01-18T16:58:16.374502713+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
59
+ {"time":"2026-01-18T17:01:49.770643385+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
60
+ {"time":"2026-01-18T17:03:00.288457229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
61
+ {"time":"2026-01-18T17:03:45.353334974+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
62
+ {"time":"2026-01-18T18:17:45.365055726+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
63
+ {"time":"2026-01-18T18:24:00.357867283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
64
+ {"time":"2026-01-18T19:06:15.375047877+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
65
+ {"time":"2026-01-18T19:06:28.413756607+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
66
+ {"time":"2026-01-18T19:15:30.232002999+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
67
+ {"time":"2026-01-18T19:39:30.251864251+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
68
+ {"time":"2026-01-18T19:40:00.288831216+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
69
+ {"time":"2026-01-18T19:52:30.252619907+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
70
+ {"time":"2026-01-18T20:51:49.773485296+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
71
+ {"time":"2026-01-18T21:32:54.188737252+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
72
+ {"time":"2026-01-18T22:14:31.789385651+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
73
+ {"time":"2026-01-19T00:11:15.393839366+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
74
+ {"time":"2026-01-19T00:50:30.380524837+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
75
+ {"time":"2026-01-19T00:51:00.395000654+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
76
+ {"time":"2026-01-19T00:51:13.162530742+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
77
+ {"time":"2026-01-19T00:54:30.249839041+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
78
+ {"time":"2026-01-19T00:55:30.349433303+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
79
+ {"time":"2026-01-19T01:00:31.333972122+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
80
+ {"time":"2026-01-19T01:19:30.367251508+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
81
+ {"time":"2026-01-19T01:20:30.296201955+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
82
+ {"time":"2026-01-19T01:51:00.221611746+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
83
+ {"time":"2026-01-19T01:52:30.445846213+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
84
+ {"time":"2026-01-19T02:02:15.651403576+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
85
+ {"time":"2026-01-19T02:02:17.343084437+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
86
+ {"time":"2026-01-19T02:02:17.352284781+08:00","level":"INFO","msg":"stream: closing","id":"xbap43rk"}
87
+ {"time":"2026-01-19T02:02:17.35229661+08:00","level":"INFO","msg":"handler: closed","stream_id":"xbap43rk"}
88
+ {"time":"2026-01-19T02:02:17.384196864+08:00","level":"INFO","msg":"sender: closed","stream_id":"xbap43rk"}
89
+ {"time":"2026-01-19T02:02:17.384209276+08:00","level":"INFO","msg":"stream: closed","id":"xbap43rk"}
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/run-xbap43rk.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7eb50f80f1190a86e2744977be0372f4150f63c16e050177b613fb7d1e84338
3
+ size 110227380
qwen3vl_bridge_rt1_QwenOFT_0112_1323/config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
4
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
5
+ data_mix: bridge_rt_1
6
+ data_root_dir: ./playground/Datasets/OXE_LEROBOT
7
+ dataset_py: lerobot_datasets
8
+ image_size:
9
+ - 224
10
+ - 224
11
+ per_device_batch_size: 8
12
+ video_backend: torchvision_av
13
+ framework:
14
+ action_model:
15
+ action_dim: 7
16
+ action_hidden_dim: 4096
17
+ action_model_type: DiT-B
18
+ future_action_window_size: 15
19
+ past_action_window_size: 0
20
+ name: QwenOFT
21
+ qwenvl:
22
+ base_vlm: /home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
23
+ output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323
24
+ run_id: qwen3vl_bridge_rt1_QwenOFT_0112_1323
25
+ run_root_dir: ./Checkpoints
26
+ seed: 42
27
+ trainer:
28
+ eval_interval: 200
29
+ freeze_modules: true
30
+ gradient_accumulation_steps: 1
31
+ gradient_clipping: 1.0
32
+ is_resume: false
33
+ learning_rate:
34
+ action_model: 0.0001
35
+ base: 1.0e-05
36
+ qwen_vl_interface: 1.0e-05
37
+ logging_frequency: 50
38
+ lr_scheduler_type: cosine_with_min_lr
39
+ max_train_steps: 100000
40
+ num_warmup_steps: 10000
41
+ optimizer:
42
+ betas:
43
+ - 0.9
44
+ - 0.95
45
+ eps: 1.0e-08
46
+ weight_decay: 1.0e-08
47
+ save_interval: 10000
48
+ scheduler_specific_kwargs:
49
+ min_lr: 5.0e-07
50
+ wandb_entity: lookas
51
+ wandb_project: Qwen3VL_Bridge_RT1_OFT
qwen3vl_bridge_rt1_QwenOFT_0112_1323/dataset_statistics.json ADDED
@@ -0,0 +1,264 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "oxe_bridge": {
3
+ "action": {
4
+ "mean": [
5
+ 0.00011365935642970726,
6
+ 6.556110747624189e-05,
7
+ -6.320965621853247e-05,
8
+ -7.205353176686913e-05,
9
+ -0.00019515302847139537,
10
+ 0.0001203166029881686,
11
+ 0.28829458355903625
12
+ ],
13
+ "std": [
14
+ 0.006909770731857718,
15
+ 0.009684093232852218,
16
+ 0.00896290498528129,
17
+ 0.020121052930683073,
18
+ 0.021582655517295487,
19
+ 0.054723342223346974,
20
+ 0.4543627821514982
21
+ ],
22
+ "max": [
23
+ 0.41691166162490845,
24
+ 0.25864794850349426,
25
+ 0.21218234300613403,
26
+ 3.122201919555664,
27
+ 1.8618112802505493,
28
+ 6.272472858428955,
29
+ 1.0
30
+ ],
31
+ "min": [
32
+ -0.4007510244846344,
33
+ -0.13874775171279907,
34
+ -0.22553899884223938,
35
+ -3.2010786533355713,
36
+ -1.8618112802505493,
37
+ -6.279075622558594,
38
+ 0.0
39
+ ],
40
+ "q01": [
41
+ -0.02875255048274994,
42
+ -0.04170213546603918,
43
+ -0.026096721179783344,
44
+ -0.08052874729037285,
45
+ -0.09249906800687313,
46
+ -0.20738555490970612,
47
+ 0.0
48
+ ],
49
+ "q99": [
50
+ 0.028306663036346436,
51
+ 0.04089853074401617,
52
+ 0.0401805154979229,
53
+ 0.08173403143882751,
54
+ 0.07760760560631752,
55
+ 0.2038465365767479,
56
+ 1.0
57
+ ],
58
+ "mask": [
59
+ true,
60
+ true,
61
+ true,
62
+ true,
63
+ true,
64
+ true,
65
+ false
66
+ ]
67
+ },
68
+ "state": {
69
+ "mean": [
70
+ 0.15471743047237396,
71
+ 0.015362550504505634,
72
+ 0.03222028166055679,
73
+ 0.0032453201711177826,
74
+ -0.038600146770477295,
75
+ 0.05382946878671646,
76
+ 0.0,
77
+ 0.35406652092933655
78
+ ],
79
+ "std": [
80
+ 0.1605359274864927,
81
+ 0.06677912092232112,
82
+ 0.048657150951527554,
83
+ 0.09275336958940797,
84
+ 0.12566984746914736,
85
+ 0.41222738578801793,
86
+ 0.0,
87
+ 0.4330223535305803
88
+ ],
89
+ "max": [
90
+ 0.5862360596656799,
91
+ 0.4034728705883026,
92
+ 0.3568263053894043,
93
+ 1.3517684936523438,
94
+ 1.570796251296997,
95
+ 3.141204357147217,
96
+ 0.0,
97
+ 1.1121242046356201
98
+ ],
99
+ "min": [
100
+ -0.04167502000927925,
101
+ -0.3563207685947418,
102
+ -0.15537554025650024,
103
+ -3.141592502593994,
104
+ -1.4992541074752808,
105
+ -3.14153790473938,
106
+ 0.0,
107
+ 0.04637829214334488
108
+ ],
109
+ "q01": [
110
+ 0.17102622985839844,
111
+ -0.1698118858039379,
112
+ -0.055632163770496845,
113
+ -0.36493172496557236,
114
+ -0.541871190071106,
115
+ -1.354275494813919,
116
+ 0.0,
117
+ 0.052190229296684265
118
+ ],
119
+ "q99": [
120
+ 0.45322076976299286,
121
+ 0.2354845181107521,
122
+ 0.19489620998501778,
123
+ 0.3780156075954437,
124
+ 0.27568644285202026,
125
+ 1.8500566184520721,
126
+ 0.0,
127
+ 1.0105689764022827
128
+ ]
129
+ },
130
+ "num_transitions": 1305714,
131
+ "num_trajectories": 53192
132
+ },
133
+ "oxe_rt1": {
134
+ "action": {
135
+ "mean": [
136
+ 0.003493750700727105,
137
+ 0.003132961690425873,
138
+ -0.0063125672750175,
139
+ 0.02166595682501793,
140
+ -0.0028780836146324873,
141
+ 0.0004565489653032273,
142
+ 0.26771023869514465
143
+ ],
144
+ "std": [
145
+ 0.049065014465362655,
146
+ 0.04229853739828572,
147
+ 0.05237628880142378,
148
+ 0.1124860236500875,
149
+ 0.09312952783816872,
150
+ 0.10319098309601091,
151
+ 0.4418448662622395
152
+ ],
153
+ "max": [
154
+ 2.9984593391418457,
155
+ 22.09052848815918,
156
+ 2.7507524490356445,
157
+ 1.570636510848999,
158
+ 1.5321086645126343,
159
+ 1.5691522359848022,
160
+ 1.0
161
+ ],
162
+ "min": [
163
+ -2.0204520225524902,
164
+ -5.497899532318115,
165
+ -2.031663417816162,
166
+ -1.569917917251587,
167
+ -1.569892168045044,
168
+ -1.570419430732727,
169
+ 0.0
170
+ ],
171
+ "q01": [
172
+ -0.22453527510166169,
173
+ -0.14820013284683228,
174
+ -0.231589707583189,
175
+ -0.3517994859814644,
176
+ -0.4193011274933815,
177
+ -0.43643461108207704,
178
+ 0.0
179
+ ],
180
+ "q99": [
181
+ 0.17824687153100965,
182
+ 0.14938379630446405,
183
+ 0.21842354819178575,
184
+ 0.5892666035890578,
185
+ 0.35272657424211445,
186
+ 0.44796681255102094,
187
+ 1.0
188
+ ],
189
+ "mask": [
190
+ true,
191
+ true,
192
+ true,
193
+ true,
194
+ true,
195
+ true,
196
+ false
197
+ ]
198
+ },
199
+ "state": {
200
+ "mean": [
201
+ 0.2799473702907562,
202
+ -0.04167069122195244,
203
+ 0.38854750990867615,
204
+ 0.21306729316711426,
205
+ -0.12402277439832687,
206
+ 0.24756911396980286,
207
+ 0.046330634504556656,
208
+ 0.10487449914216995
209
+ ],
210
+ "std": [
211
+ 0.29342642876909925,
212
+ 0.09174024655686211,
213
+ 0.42569508885539115,
214
+ 0.38616252611341306,
215
+ 0.38314586427420927,
216
+ 0.44433568806919804,
217
+ 0.1263927443679382,
218
+ 0.22122596673781084
219
+ ],
220
+ "max": [
221
+ 1.0534898042678833,
222
+ 0.48018959164619446,
223
+ 1.6896663904190063,
224
+ 1.0,
225
+ 0.9999993443489075,
226
+ 0.9999874830245972,
227
+ 0.9554369449615479,
228
+ 0.9914546012878418
229
+ ],
230
+ "min": [
231
+ -0.4436439275741577,
232
+ -0.9970501065254211,
233
+ -0.006579156965017319,
234
+ 0.0,
235
+ -0.8643477559089661,
236
+ -0.7079970240592957,
237
+ -0.7688722014427185,
238
+ -0.4999994933605194
239
+ ],
240
+ "q01": [
241
+ 0.32481380939483645,
242
+ -0.28334290891885755,
243
+ 0.14107070609927178,
244
+ 0.0,
245
+ -0.686474204659462,
246
+ -0.6808923494815826,
247
+ -0.36045596331357954,
248
+ -0.454380963742733
249
+ ],
250
+ "q99": [
251
+ 0.8750156319141384,
252
+ 0.21247054174542404,
253
+ 1.0727112340927123,
254
+ 1.0,
255
+ 0.9377871316671368,
256
+ 0.9563051050901409,
257
+ 0.45990042358636823,
258
+ 0.7216041100025177
259
+ ]
260
+ },
261
+ "num_transitions": 3786152,
262
+ "num_trajectories": 87212
263
+ }
264
+ }
qwen3vl_bridge_rt1_QwenOFT_0112_1323/run_qwen3vl_bridge_rt1_qwen_oft.sh ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Framework_name=QwenOFT
2
+ dit_type="DiT-B"
3
+ freeze_module_list='' # fully FT, e.g., freeze_module_list=""
4
+ data_mix=bridge_rt_1
5
+
6
+ ## Modify below paths before running ##
7
+ date_time=$(date +%m%d_%H%M)
8
+ config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
9
+ base_vlm=/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
10
+ data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
11
+ run_root_dir=./Checkpoints
12
+ run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
13
+ batch_size=8
14
+ wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
15
+ wandb_entity=lookas
16
+
17
+ # export WANDB_MODE=disabled
18
+
19
+ output_dir=${run_root_dir}/${run_id}
20
+ mkdir -p ${output_dir}
21
+ cp $0 ${output_dir}/
22
+
23
+
24
+ accelerate launch --main_process_port 12773 \
25
+ --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
26
+ --num_processes 8 \
27
+ starVLA/training/train_starvla.py \
28
+ --config_yaml ${config_yaml} \
29
+ --framework.name ${Framework_name} \
30
+ --framework.qwenvl.base_vlm ${base_vlm} \
31
+ --datasets.vla_data.data_root_dir ${data_root_dir}\
32
+ --datasets.vla_data.data_mix ${data_mix} \
33
+ --datasets.vla_data.per_device_batch_size ${batch_size} \
34
+ --trainer.freeze_modules ${freeze_module_list} \
35
+ --trainer.max_train_steps 100000 \
36
+ --trainer.save_interval 10000 \
37
+ --trainer.logging_frequency 50 \
38
+ --trainer.eval_interval 200 \
39
+ --run_root_dir ${run_root_dir} \
40
+ --run_id ${run_id} \
41
+ --output_dir ${output_dir} \
42
+ --wandb.project ${wandb_project} \
43
+ --wandb.entity ${wandb_entity}
44
+
45
+
46
+ # multi-node launch example
47
+
48
+ # accelerate launch \
49
+ # --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
50
+ # --main_process_ip $MASTER_ADDR \
51
+ # --main_process_port $MASTER_PORT \
52
+ # --machine_rank $SLURM_PROCID \
53
+ # --num_machines $SLURM_NNODES \
54
+ # --num_processes=${TOTAL_GPUS} \
55
+ # starVLA/training/train_starvla.py \
56
+ # --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
57
+ # --framework.framework_py QwenGR00T \
58
+ # --framework.qwenvl.base_vlm microsoft/Florence-2-large \
59
+ # --run_root_dir ${run_root_dir} \
60
+ # --run_id ${run_id} \
61
+ # --wandb_project your_project \
62
+ # --wandb_entity your_name
qwen3vl_bridge_rt1_QwenOFT_0112_1323/summary.jsonl ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {"steps": 10000}
2
+ {"steps": 20000}
3
+ {"steps": 30000}
4
+ {"steps": 40000}
5
+ {"steps": 50000}
6
+ {"steps": 60000}
7
+ {"steps": 70000}
8
+ {"steps": 80000}
9
+ {"steps": 90000}
10
+ {"steps": 100000}
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug-internal.log ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-12T13:33:02.374820947+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-12T13:33:03.82154982+08:00","level":"INFO","msg":"stream: created new stream","id":"ueywjhk5"}
3
+ {"time":"2026-01-12T13:33:03.821725323+08:00","level":"INFO","msg":"handler: started","stream_id":"ueywjhk5"}
4
+ {"time":"2026-01-12T13:33:03.846752186+08:00","level":"INFO","msg":"stream: started","id":"ueywjhk5"}
5
+ {"time":"2026-01-12T13:33:03.846770681+08:00","level":"INFO","msg":"writer: started","stream_id":"ueywjhk5"}
6
+ {"time":"2026-01-12T13:33:03.846770288+08:00","level":"INFO","msg":"sender: started","stream_id":"ueywjhk5"}
7
+ {"time":"2026-01-12T14:18:31.589248229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
8
+ {"time":"2026-01-12T14:39:00.33374833+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
9
+ {"time":"2026-01-12T14:45:00.196854395+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
10
+ {"time":"2026-01-12T15:30:49.608798424+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": net/http: request canceled while waiting for connection (Client.Timeout exceeded while awaiting headers)"}
11
+ {"time":"2026-01-12T15:58:15.168936649+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
12
+ {"time":"2026-01-12T16:32:15.169856477+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
13
+ {"time":"2026-01-12T16:32:28.120660769+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
14
+ {"time":"2026-01-12T18:52:15.110123119+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-12T20:25:15.093766297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
16
+ {"time":"2026-01-12T20:46:29.622105415+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": Gateway Timeout"}
17
+ {"time":"2026-01-12T20:57:51.676789447+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
18
+ {"time":"2026-01-12T21:34:03.873286543+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
19
+ {"time":"2026-01-12T21:57:16.546518785+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
20
+ {"time":"2026-01-12T22:29:15.864952943+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
21
+ {"time":"2026-01-12T22:36:13.618868987+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
22
+ {"time":"2026-01-12T22:36:31.272703076+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
23
+ {"time":"2026-01-13T00:17:45.174009838+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
24
+ {"time":"2026-01-13T00:17:57.789671331+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
25
+ {"time":"2026-01-13T00:18:45.160525879+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
26
+ {"time":"2026-01-13T01:22:18.006447633+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
27
+ {"time":"2026-01-13T02:03:21.340298852+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
28
+ {"time":"2026-01-13T03:04:34.668877357+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
29
+ {"time":"2026-01-13T03:04:47.661210297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
30
+ {"time":"2026-01-13T03:12:30.235091077+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
31
+ {"time":"2026-01-13T03:13:15.087092941+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
32
+ {"time":"2026-01-13T05:33:30.27306441+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
33
+ {"time":"2026-01-13T05:33:45.195585087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
34
+ {"time":"2026-01-13T05:34:15.047256192+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
35
+ {"time":"2026-01-13T06:34:30.165692234+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
36
+ {"time":"2026-01-13T06:34:42.845804108+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
37
+ {"time":"2026-01-13T06:34:59.430634519+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
38
+ {"time":"2026-01-13T06:35:45.090534347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
39
+ {"time":"2026-01-13T06:38:45.24671956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
40
+ {"time":"2026-01-13T06:40:00.085760676+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
41
+ {"time":"2026-01-13T06:40:30.253594276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
42
+ {"time":"2026-01-13T06:40:45.119737819+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
43
+ {"time":"2026-01-13T06:41:01.006178451+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
44
+ {"time":"2026-01-13T09:01:01.259781836+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
45
+ {"time":"2026-01-13T10:20:27.160154786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
46
+ {"time":"2026-01-13T11:23:00.198050425+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
47
+ {"time":"2026-01-13T11:24:00.137963825+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
48
+ {"time":"2026-01-13T11:41:16.643086394+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
49
+ {"time":"2026-01-13T12:21:36.803454674+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
50
+ {"time":"2026-01-13T12:29:23.122571501+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
51
+ {"time":"2026-01-13T12:59:15.208303261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
52
+ {"time":"2026-01-13T13:06:15.210877761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
53
+ {"time":"2026-01-13T13:06:27.856833979+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
54
+ {"time":"2026-01-13T13:09:06.355015154+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
55
+ {"time":"2026-01-13T13:40:00.126142378+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
56
+ {"time":"2026-01-13T13:46:32.168389695+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
57
+ {"time":"2026-01-13T13:48:15.081349554+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
58
+ {"time":"2026-01-13T13:57:00.197403381+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
59
+ {"time":"2026-01-13T15:57:25.317460174+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
60
+ {"time":"2026-01-13T15:59:46.726236225+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
61
+ {"time":"2026-01-13T16:09:46.448847236+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
62
+ {"time":"2026-01-13T16:58:01.095875797+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
63
+ {"time":"2026-01-13T17:24:10.021730043+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
64
+ {"time":"2026-01-13T18:27:15.075407399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
65
+ {"time":"2026-01-13T18:36:00.080917996+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
66
+ {"time":"2026-01-13T18:36:30.217018153+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
67
+ {"time":"2026-01-13T18:38:00.137187254+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
68
+ {"time":"2026-01-13T18:54:07.673379631+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
69
+ {"time":"2026-01-13T19:07:00.253334334+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
70
+ {"time":"2026-01-13T19:15:30.09514757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
71
+ {"time":"2026-01-13T20:25:51.505745758+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
72
+ {"time":"2026-01-13T21:59:51.560168548+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
73
+ {"time":"2026-01-13T23:25:27.580587803+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
74
+ {"time":"2026-01-13T23:25:28.86707285+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
75
+ {"time":"2026-01-13T23:25:28.876898999+08:00","level":"INFO","msg":"stream: closing","id":"ueywjhk5"}
76
+ {"time":"2026-01-13T23:25:28.876914442+08:00","level":"INFO","msg":"handler: closed","stream_id":"ueywjhk5"}
77
+ {"time":"2026-01-13T23:25:28.90868024+08:00","level":"INFO","msg":"sender: closed","stream_id":"ueywjhk5"}
78
+ {"time":"2026-01-13T23:25:28.90870897+08:00","level":"INFO","msg":"stream: closed","id":"ueywjhk5"}
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/config.yaml ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.23.1
4
+ e:
5
+ 3h4xzexd9mhzcjwlbp7j0zfzyqq963et:
6
+ args:
7
+ - --config_yaml
8
+ - scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
9
+ - --framework.name
10
+ - QwenOFT
11
+ - --framework.qwenvl.base_vlm
12
+ - /home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
13
+ - --datasets.vla_data.data_root_dir
14
+ - ./playground/Datasets/OXE_LEROBOT
15
+ - --datasets.vla_data.data_mix
16
+ - bridge_rt_1
17
+ - --datasets.vla_data.per_device_batch_size
18
+ - "8"
19
+ - --trainer.freeze_modules
20
+ - --trainer.max_train_steps
21
+ - "100000"
22
+ - --trainer.save_interval
23
+ - "10000"
24
+ - --trainer.logging_frequency
25
+ - "50"
26
+ - --trainer.eval_interval
27
+ - "200"
28
+ - --run_root_dir
29
+ - ./Checkpoints
30
+ - --run_id
31
+ - qwen3vl_bridge_rt1_QwenOFT_0112_1323
32
+ - --output_dir
33
+ - ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323
34
+ - --wandb.project
35
+ - Qwen3VL_Bridge_RT1_QwenOFT
36
+ - --wandb.entity
37
+ - lookas
38
+ codePath: starVLA/training/train_starvla.py
39
+ codePathLocal: starVLA/training/train_starvla.py
40
+ cpu_count: 90
41
+ cpu_count_logical: 180
42
+ cudaVersion: "12.4"
43
+ disk:
44
+ /:
45
+ total: "3779301580800"
46
+ used: "159098298368"
47
+ email: hilookas@gmail.com
48
+ executable: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3
49
+ git:
50
+ commit: ab531aff5b27795879c61f67892330a616e9dbf0
51
+ remote: https://github.com/hilookas/starVLA_pickxiguapi
52
+ gpu: NVIDIA H20
53
+ gpu_count: 8
54
+ gpu_nvidia:
55
+ - architecture: Hopper
56
+ cudaCores: 9984
57
+ memoryTotal: "102625181696"
58
+ name: NVIDIA H20
59
+ uuid: GPU-f99bae5f-ffca-4972-6420-64c42ba64f22
60
+ - architecture: Hopper
61
+ cudaCores: 9984
62
+ memoryTotal: "102625181696"
63
+ name: NVIDIA H20
64
+ uuid: GPU-a00709c9-6bdf-4011-64dc-95421da94ba4
65
+ - architecture: Hopper
66
+ cudaCores: 9984
67
+ memoryTotal: "102625181696"
68
+ name: NVIDIA H20
69
+ uuid: GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5
70
+ - architecture: Hopper
71
+ cudaCores: 9984
72
+ memoryTotal: "102625181696"
73
+ name: NVIDIA H20
74
+ uuid: GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9
75
+ - architecture: Hopper
76
+ cudaCores: 9984
77
+ memoryTotal: "102625181696"
78
+ name: NVIDIA H20
79
+ uuid: GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218
80
+ - architecture: Hopper
81
+ cudaCores: 9984
82
+ memoryTotal: "102625181696"
83
+ name: NVIDIA H20
84
+ uuid: GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde
85
+ - architecture: Hopper
86
+ cudaCores: 9984
87
+ memoryTotal: "102625181696"
88
+ name: NVIDIA H20
89
+ uuid: GPU-4fa493fc-c408-182f-138e-bcc15c7f9138
90
+ - architecture: Hopper
91
+ cudaCores: 9984
92
+ memoryTotal: "102625181696"
93
+ name: NVIDIA H20
94
+ uuid: GPU-16ef9185-6132-8620-ad2e-1f8920ded508
95
+ host: g340-cd51-7700-770-343f-3fec-69bb
96
+ memory:
97
+ total: "2071188119552"
98
+ os: Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36
99
+ program: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py
100
+ python: CPython 3.10.19
101
+ root: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb
102
+ startedAt: "2026-01-12T05:32:56.070975Z"
103
+ writerId: 3h4xzexd9mhzcjwlbp7j0zfzyqq963et
104
+ m: []
105
+ python_version: 3.10.19
106
+ t:
107
+ "1":
108
+ - 1
109
+ - 11
110
+ - 41
111
+ - 49
112
+ - 63
113
+ - 71
114
+ - 80
115
+ - 83
116
+ "2":
117
+ - 1
118
+ - 11
119
+ - 41
120
+ - 49
121
+ - 63
122
+ - 71
123
+ - 80
124
+ - 83
125
+ "3":
126
+ - 2
127
+ - 13
128
+ - 61
129
+ "4": 3.10.19
130
+ "5": 0.23.1
131
+ "6": 4.57.3
132
+ "12": 0.23.1
133
+ "13": linux-x86_64
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/requirements.txt ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ starVLA==1.0.1
2
+ absl-py==2.3.1
3
+ accelerate==1.5.2
4
+ albucore==0.0.17
5
+ albumentations==1.4.18
6
+ annotated-types==0.7.0
7
+ antlr4-python3-runtime==4.9.3
8
+ anyio==4.12.0
9
+ asttokens==3.0.1
10
+ attrs==20.3.0
11
+ av==12.3.0
12
+ bddl==1.0.1
13
+ certifi==2025.11.12
14
+ charset-normalizer==3.4.4
15
+ click==8.3.1
16
+ cloudpickle==3.1.2
17
+ contourpy==1.3.2
18
+ cramjam==2.11.0
19
+ cycler==0.12.1
20
+ debugpy==1.8.19
21
+ decorator==5.2.1
22
+ decord==0.6.0
23
+ deepspeed==0.16.9
24
+ diffusers==0.36.0
25
+ docstring_parser==0.17.0
26
+ easydict==1.9
27
+ einops==0.8.1
28
+ etils==1.13.0
29
+ eva-decord==0.6.1
30
+ eval_type_backport==0.3.1
31
+ exceptiongroup==1.3.1
32
+ executing==2.2.1
33
+ fastjsonschema==2.21.2
34
+ fastparquet==2024.11.0
35
+ filelock==3.20.2
36
+ flash_attn==2.8.3
37
+ fonttools==4.61.1
38
+ fsspec==2025.12.0
39
+ future==0.18.2
40
+ fvcore==0.1.5.post20221221
41
+ gevent==25.9.1
42
+ gitdb==4.0.12
43
+ GitPython==3.1.46
44
+ glfw==2.10.0
45
+ greenlet==3.3.0
46
+ grpcio==1.76.0
47
+ gym==0.26.2
48
+ gym-notices==0.1.0
49
+ h11==0.16.0
50
+ hf-xet==1.2.0
51
+ hjson==3.1.0
52
+ httpcore==1.0.9
53
+ httpx==0.28.1
54
+ huggingface-hub==0.36.0
55
+ idna==3.11
56
+ ImageIO==2.37.2
57
+ importlib_metadata==8.7.1
58
+ importlib_resources==6.5.2
59
+ iniconfig==2.3.0
60
+ iopath==0.1.10
61
+ ipdb==0.13.13
62
+ ipython==8.37.0
63
+ jedi==0.19.2
64
+ Jinja2==3.1.6
65
+ jsonschema==4.17.3
66
+ jupyter_core==5.9.1
67
+ jupytext==1.18.1
68
+ kiwisolver==1.4.9
69
+ lazy_loader==0.4
70
+ libero==0.1.0
71
+ llvmlite==0.46.0
72
+ Markdown==3.10
73
+ markdown-it-py==4.0.0
74
+ MarkupSafe==3.0.3
75
+ matplotlib==3.10.8
76
+ matplotlib-inline==0.2.1
77
+ mdit-py-plugins==0.5.0
78
+ mdurl==0.1.2
79
+ mpmath==1.3.0
80
+ msgpack==1.1.2
81
+ mujoco==3.4.0
82
+ nbformat==5.10.4
83
+ networkx==3.4.2
84
+ ninja==1.13.0
85
+ numba==0.63.1
86
+ numpy==1.26.4
87
+ numpydantic==1.6.9
88
+ nvidia-cublas-cu12==12.4.5.8
89
+ nvidia-cuda-cupti-cu12==12.4.127
90
+ nvidia-cuda-nvrtc-cu12==12.4.127
91
+ nvidia-cuda-runtime-cu12==12.4.127
92
+ nvidia-cudnn-cu12==9.1.0.70
93
+ nvidia-cufft-cu12==11.2.1.3
94
+ nvidia-curand-cu12==10.3.5.147
95
+ nvidia-cusolver-cu12==11.6.1.9
96
+ nvidia-cusparse-cu12==12.3.1.170
97
+ nvidia-nccl-cu12==2.21.5
98
+ nvidia-nvjitlink-cu12==12.4.127
99
+ nvidia-nvtx-cu12==12.4.127
100
+ omegaconf==2.3.0
101
+ opencv-python==4.11.0.86
102
+ opencv-python-headless==4.11.0.86
103
+ packaging==25.0
104
+ pandas==2.3.3
105
+ parso==0.8.5
106
+ pexpect==4.9.0
107
+ pillow==12.1.0
108
+ pipablepytorch3d==0.7.6
109
+ platformdirs==4.5.1
110
+ pluggy==1.6.0
111
+ portalocker==3.2.0
112
+ prompt_toolkit==3.0.52
113
+ protobuf==6.33.2
114
+ psutil==7.2.1
115
+ ptyprocess==0.7.0
116
+ pure_eval==0.2.3
117
+ py-cpuinfo==9.0.0
118
+ pyarrow==14.0.1
119
+ pydantic==2.10.6
120
+ pydantic_core==2.27.2
121
+ Pygments==2.19.2
122
+ PyOpenGL==3.1.10
123
+ pyparsing==3.3.1
124
+ pyrsistent==0.20.0
125
+ pytest==9.0.2
126
+ python-dateutil==2.9.0.post0
127
+ pytz==2025.2
128
+ PyYAML==6.0.3
129
+ qwen-vl-utils==0.0.14
130
+ regex==2025.11.3
131
+ requests==2.32.5
132
+ rich==14.2.0
133
+ robosuite==1.4.0
134
+ safetensors==0.7.0
135
+ scikit-image==0.25.2
136
+ scipy==1.15.3
137
+ sentry-sdk==2.48.0
138
+ setuptools==80.9.0
139
+ six==1.17.0
140
+ smmap==5.0.2
141
+ stack-data==0.6.3
142
+ starVLA==1.0.1
143
+ sympy==1.13.1
144
+ tabulate==0.9.0
145
+ tensorboard==2.20.0
146
+ tensorboard-data-server==0.7.2
147
+ termcolor==3.3.0
148
+ tifffile==2025.5.10
149
+ tiktoken==0.12.0
150
+ timm==1.0.22
151
+ tokenizers==0.22.1
152
+ tomli==2.3.0
153
+ torch==2.5.1
154
+ torchvision==0.20.1
155
+ tqdm==4.67.1
156
+ traitlets==5.14.3
157
+ transformers==4.57.3
158
+ transformers-stream-generator==0.0.4
159
+ triton==3.1.0
160
+ typeguard==4.4.4
161
+ typing_extensions==4.15.0
162
+ tyro==1.0.3
163
+ tzdata==2025.3
164
+ urllib3==2.6.2
165
+ wandb==0.23.1
166
+ wcwidth==0.2.14
167
+ websocket==0.2.1
168
+ websocket-client==1.8.0
169
+ websockets==15.0.1
170
+ Werkzeug==3.1.4
171
+ yacs==0.1.8
172
+ zipp==3.23.0
173
+ zope.event==6.1
174
+ zope.interface==8.1.1
175
+ autocommand==2.2.2
176
+ backports.tarfile==1.2.0
177
+ importlib_metadata==8.0.0
178
+ inflect==7.3.1
179
+ jaraco.collections==5.1.0
180
+ jaraco.context==5.3.0
181
+ jaraco.functools==4.0.1
182
+ jaraco.text==3.12.1
183
+ more-itertools==10.3.0
184
+ packaging==24.2
185
+ platformdirs==4.2.2
186
+ tomli==2.0.1
187
+ typeguard==4.3.0
188
+ typing_extensions==4.12.2
189
+ wheel==0.45.1
190
+ zipp==3.19.2
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-metadata.json ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36",
3
+ "python": "CPython 3.10.19",
4
+ "startedAt": "2026-01-12T05:32:56.070975Z",
5
+ "args": [
6
+ "--config_yaml",
7
+ "scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml",
8
+ "--framework.name",
9
+ "QwenOFT",
10
+ "--framework.qwenvl.base_vlm",
11
+ "/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b",
12
+ "--datasets.vla_data.data_root_dir",
13
+ "./playground/Datasets/OXE_LEROBOT",
14
+ "--datasets.vla_data.data_mix",
15
+ "bridge_rt_1",
16
+ "--datasets.vla_data.per_device_batch_size",
17
+ "8",
18
+ "--trainer.freeze_modules",
19
+ "--trainer.max_train_steps",
20
+ "100000",
21
+ "--trainer.save_interval",
22
+ "10000",
23
+ "--trainer.logging_frequency",
24
+ "50",
25
+ "--trainer.eval_interval",
26
+ "200",
27
+ "--run_root_dir",
28
+ "./Checkpoints",
29
+ "--run_id",
30
+ "qwen3vl_bridge_rt1_QwenOFT_0112_1323",
31
+ "--output_dir",
32
+ "./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323",
33
+ "--wandb.project",
34
+ "Qwen3VL_Bridge_RT1_QwenOFT",
35
+ "--wandb.entity",
36
+ "lookas"
37
+ ],
38
+ "program": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py",
39
+ "codePath": "starVLA/training/train_starvla.py",
40
+ "codePathLocal": "starVLA/training/train_starvla.py",
41
+ "git": {
42
+ "remote": "https://github.com/hilookas/starVLA_pickxiguapi",
43
+ "commit": "ab531aff5b27795879c61f67892330a616e9dbf0"
44
+ },
45
+ "email": "hilookas@gmail.com",
46
+ "root": "./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb",
47
+ "host": "g340-cd51-7700-770-343f-3fec-69bb",
48
+ "executable": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3",
49
+ "cpu_count": 90,
50
+ "cpu_count_logical": 180,
51
+ "gpu": "NVIDIA H20",
52
+ "gpu_count": 8,
53
+ "disk": {
54
+ "/": {
55
+ "total": "3779301580800",
56
+ "used": "159098298368"
57
+ }
58
+ },
59
+ "memory": {
60
+ "total": "2071188119552"
61
+ },
62
+ "gpu_nvidia": [
63
+ {
64
+ "name": "NVIDIA H20",
65
+ "memoryTotal": "102625181696",
66
+ "cudaCores": 9984,
67
+ "architecture": "Hopper",
68
+ "uuid": "GPU-f99bae5f-ffca-4972-6420-64c42ba64f22"
69
+ },
70
+ {
71
+ "name": "NVIDIA H20",
72
+ "memoryTotal": "102625181696",
73
+ "cudaCores": 9984,
74
+ "architecture": "Hopper",
75
+ "uuid": "GPU-a00709c9-6bdf-4011-64dc-95421da94ba4"
76
+ },
77
+ {
78
+ "name": "NVIDIA H20",
79
+ "memoryTotal": "102625181696",
80
+ "cudaCores": 9984,
81
+ "architecture": "Hopper",
82
+ "uuid": "GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5"
83
+ },
84
+ {
85
+ "name": "NVIDIA H20",
86
+ "memoryTotal": "102625181696",
87
+ "cudaCores": 9984,
88
+ "architecture": "Hopper",
89
+ "uuid": "GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9"
90
+ },
91
+ {
92
+ "name": "NVIDIA H20",
93
+ "memoryTotal": "102625181696",
94
+ "cudaCores": 9984,
95
+ "architecture": "Hopper",
96
+ "uuid": "GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218"
97
+ },
98
+ {
99
+ "name": "NVIDIA H20",
100
+ "memoryTotal": "102625181696",
101
+ "cudaCores": 9984,
102
+ "architecture": "Hopper",
103
+ "uuid": "GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde"
104
+ },
105
+ {
106
+ "name": "NVIDIA H20",
107
+ "memoryTotal": "102625181696",
108
+ "cudaCores": 9984,
109
+ "architecture": "Hopper",
110
+ "uuid": "GPU-4fa493fc-c408-182f-138e-bcc15c7f9138"
111
+ },
112
+ {
113
+ "name": "NVIDIA H20",
114
+ "memoryTotal": "102625181696",
115
+ "cudaCores": 9984,
116
+ "architecture": "Hopper",
117
+ "uuid": "GPU-16ef9185-6132-8620-ad2e-1f8920ded508"
118
+ }
119
+ ],
120
+ "cudaVersion": "12.4",
121
+ "writerId": "3h4xzexd9mhzcjwlbp7j0zfzyqq963et"
122
+ }
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"epoch":0.85,"data_time":0.7947496069828048,"mse_score":0.007877199777535029,"_wandb":{"runtime":121936},"action_dit_loss":0.0705610066652298,"model_time":0.9573145949980244,"learning_rate":5e-07,"_runtime":121936.771979222,"_timestamp":1.7683178622202885e+09,"_step":100000}
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug-internal.log ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-12T13:33:02.374820947+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-12T13:33:03.82154982+08:00","level":"INFO","msg":"stream: created new stream","id":"ueywjhk5"}
3
+ {"time":"2026-01-12T13:33:03.821725323+08:00","level":"INFO","msg":"handler: started","stream_id":"ueywjhk5"}
4
+ {"time":"2026-01-12T13:33:03.846752186+08:00","level":"INFO","msg":"stream: started","id":"ueywjhk5"}
5
+ {"time":"2026-01-12T13:33:03.846770681+08:00","level":"INFO","msg":"writer: started","stream_id":"ueywjhk5"}
6
+ {"time":"2026-01-12T13:33:03.846770288+08:00","level":"INFO","msg":"sender: started","stream_id":"ueywjhk5"}
7
+ {"time":"2026-01-12T14:18:31.589248229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
8
+ {"time":"2026-01-12T14:39:00.33374833+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
9
+ {"time":"2026-01-12T14:45:00.196854395+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
10
+ {"time":"2026-01-12T15:30:49.608798424+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": net/http: request canceled while waiting for connection (Client.Timeout exceeded while awaiting headers)"}
11
+ {"time":"2026-01-12T15:58:15.168936649+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
12
+ {"time":"2026-01-12T16:32:15.169856477+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
13
+ {"time":"2026-01-12T16:32:28.120660769+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
14
+ {"time":"2026-01-12T18:52:15.110123119+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-12T20:25:15.093766297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
16
+ {"time":"2026-01-12T20:46:29.622105415+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": Gateway Timeout"}
17
+ {"time":"2026-01-12T20:57:51.676789447+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
18
+ {"time":"2026-01-12T21:34:03.873286543+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
19
+ {"time":"2026-01-12T21:57:16.546518785+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
20
+ {"time":"2026-01-12T22:29:15.864952943+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
21
+ {"time":"2026-01-12T22:36:13.618868987+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
22
+ {"time":"2026-01-12T22:36:31.272703076+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
23
+ {"time":"2026-01-13T00:17:45.174009838+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
24
+ {"time":"2026-01-13T00:17:57.789671331+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
25
+ {"time":"2026-01-13T00:18:45.160525879+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
26
+ {"time":"2026-01-13T01:22:18.006447633+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
27
+ {"time":"2026-01-13T02:03:21.340298852+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
28
+ {"time":"2026-01-13T03:04:34.668877357+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
29
+ {"time":"2026-01-13T03:04:47.661210297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
30
+ {"time":"2026-01-13T03:12:30.235091077+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
31
+ {"time":"2026-01-13T03:13:15.087092941+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
32
+ {"time":"2026-01-13T05:33:30.27306441+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
33
+ {"time":"2026-01-13T05:33:45.195585087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
34
+ {"time":"2026-01-13T05:34:15.047256192+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
35
+ {"time":"2026-01-13T06:34:30.165692234+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
36
+ {"time":"2026-01-13T06:34:42.845804108+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
37
+ {"time":"2026-01-13T06:34:59.430634519+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
38
+ {"time":"2026-01-13T06:35:45.090534347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
39
+ {"time":"2026-01-13T06:38:45.24671956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
40
+ {"time":"2026-01-13T06:40:00.085760676+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
41
+ {"time":"2026-01-13T06:40:30.253594276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
42
+ {"time":"2026-01-13T06:40:45.119737819+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
43
+ {"time":"2026-01-13T06:41:01.006178451+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
44
+ {"time":"2026-01-13T09:01:01.259781836+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
45
+ {"time":"2026-01-13T10:20:27.160154786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
46
+ {"time":"2026-01-13T11:23:00.198050425+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
47
+ {"time":"2026-01-13T11:24:00.137963825+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
48
+ {"time":"2026-01-13T11:41:16.643086394+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
49
+ {"time":"2026-01-13T12:21:36.803454674+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
50
+ {"time":"2026-01-13T12:29:23.122571501+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
51
+ {"time":"2026-01-13T12:59:15.208303261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
52
+ {"time":"2026-01-13T13:06:15.210877761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
53
+ {"time":"2026-01-13T13:06:27.856833979+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
54
+ {"time":"2026-01-13T13:09:06.355015154+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
55
+ {"time":"2026-01-13T13:40:00.126142378+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
56
+ {"time":"2026-01-13T13:46:32.168389695+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
57
+ {"time":"2026-01-13T13:48:15.081349554+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
58
+ {"time":"2026-01-13T13:57:00.197403381+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
59
+ {"time":"2026-01-13T15:57:25.317460174+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
60
+ {"time":"2026-01-13T15:59:46.726236225+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
61
+ {"time":"2026-01-13T16:09:46.448847236+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
62
+ {"time":"2026-01-13T16:58:01.095875797+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
63
+ {"time":"2026-01-13T17:24:10.021730043+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
64
+ {"time":"2026-01-13T18:27:15.075407399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
65
+ {"time":"2026-01-13T18:36:00.080917996+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
66
+ {"time":"2026-01-13T18:36:30.217018153+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
67
+ {"time":"2026-01-13T18:38:00.137187254+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
68
+ {"time":"2026-01-13T18:54:07.673379631+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
69
+ {"time":"2026-01-13T19:07:00.253334334+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
70
+ {"time":"2026-01-13T19:15:30.09514757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
71
+ {"time":"2026-01-13T20:25:51.505745758+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
72
+ {"time":"2026-01-13T21:59:51.560168548+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
73
+ {"time":"2026-01-13T23:25:27.580587803+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
74
+ {"time":"2026-01-13T23:25:28.86707285+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
75
+ {"time":"2026-01-13T23:25:28.876898999+08:00","level":"INFO","msg":"stream: closing","id":"ueywjhk5"}
76
+ {"time":"2026-01-13T23:25:28.876914442+08:00","level":"INFO","msg":"handler: closed","stream_id":"ueywjhk5"}
77
+ {"time":"2026-01-13T23:25:28.90868024+08:00","level":"INFO","msg":"sender: closed","stream_id":"ueywjhk5"}
78
+ {"time":"2026-01-13T23:25:28.90870897+08:00","level":"INFO","msg":"stream: closed","id":"ueywjhk5"}
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/run-ueywjhk5.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83487df0cfa0c26289ddf787c1fe8b54cbfef38f3aa069954fbf2e6d6d683736
3
+ size 112544775
qwen3vl_bridge_rt1_QwenOFT_0117_1748/config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
4
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
5
+ data_mix: bridge_rt_1
6
+ data_root_dir: ./playground/Datasets/OXE_LEROBOT
7
+ dataset_py: lerobot_datasets
8
+ image_size:
9
+ - 224
10
+ - 224
11
+ per_device_batch_size: 8
12
+ video_backend: torchvision_av
13
+ framework:
14
+ action_model:
15
+ action_dim: 7
16
+ action_hidden_dim: 4096
17
+ action_model_type: DiT-B
18
+ future_action_window_size: 15
19
+ past_action_window_size: 0
20
+ name: QwenOFT
21
+ qwenvl:
22
+ base_vlm: /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
23
+ output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0117_1748
24
+ run_id: qwen3vl_bridge_rt1_QwenOFT_0117_1748
25
+ run_root_dir: ./Checkpoints
26
+ seed: 42
27
+ trainer:
28
+ eval_interval: 200
29
+ freeze_modules: true
30
+ gradient_accumulation_steps: 1
31
+ gradient_clipping: 1.0
32
+ is_resume: false
33
+ learning_rate:
34
+ action_model: 0.0001
35
+ base: 1.0e-05
36
+ qwen_vl_interface: 1.0e-05
37
+ logging_frequency: 50
38
+ lr_scheduler_type: cosine_with_min_lr
39
+ max_train_steps: 100000
40
+ num_warmup_steps: 10000
41
+ optimizer:
42
+ betas:
43
+ - 0.9
44
+ - 0.95
45
+ eps: 1.0e-08
46
+ weight_decay: 1.0e-08
47
+ save_interval: 10000
48
+ scheduler_specific_kwargs:
49
+ min_lr: 5.0e-07
50
+ wandb_entity: lookas
51
+ wandb_project: Qwen3VL_Bridge_RT1_OFT
qwen3vl_bridge_rt1_QwenOFT_0117_1748/dataset_statistics.json ADDED
@@ -0,0 +1,264 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "oxe_bridge": {
3
+ "action": {
4
+ "mean": [
5
+ 0.00011365935642970726,
6
+ 6.556110747624189e-05,
7
+ -6.320965621853247e-05,
8
+ -7.205353176686913e-05,
9
+ -0.00019515302847139537,
10
+ 0.0001203166029881686,
11
+ 0.28829458355903625
12
+ ],
13
+ "std": [
14
+ 0.006909770731857718,
15
+ 0.009684093232852218,
16
+ 0.00896290498528129,
17
+ 0.020121052930683073,
18
+ 0.021582655517295487,
19
+ 0.054723342223346974,
20
+ 0.4543627821514982
21
+ ],
22
+ "max": [
23
+ 0.41691166162490845,
24
+ 0.25864794850349426,
25
+ 0.21218234300613403,
26
+ 3.122201919555664,
27
+ 1.8618112802505493,
28
+ 6.272472858428955,
29
+ 1.0
30
+ ],
31
+ "min": [
32
+ -0.4007510244846344,
33
+ -0.13874775171279907,
34
+ -0.22553899884223938,
35
+ -3.2010786533355713,
36
+ -1.8618112802505493,
37
+ -6.279075622558594,
38
+ 0.0
39
+ ],
40
+ "q01": [
41
+ -0.02875255048274994,
42
+ -0.04170213546603918,
43
+ -0.026096721179783344,
44
+ -0.08052874729037285,
45
+ -0.09249906800687313,
46
+ -0.20738555490970612,
47
+ 0.0
48
+ ],
49
+ "q99": [
50
+ 0.028306663036346436,
51
+ 0.04089853074401617,
52
+ 0.0401805154979229,
53
+ 0.08173403143882751,
54
+ 0.07760760560631752,
55
+ 0.2038465365767479,
56
+ 1.0
57
+ ],
58
+ "mask": [
59
+ true,
60
+ true,
61
+ true,
62
+ true,
63
+ true,
64
+ true,
65
+ false
66
+ ]
67
+ },
68
+ "state": {
69
+ "mean": [
70
+ 0.15471743047237396,
71
+ 0.015362550504505634,
72
+ 0.03222028166055679,
73
+ 0.0032453201711177826,
74
+ -0.038600146770477295,
75
+ 0.05382946878671646,
76
+ 0.0,
77
+ 0.35406652092933655
78
+ ],
79
+ "std": [
80
+ 0.1605359274864927,
81
+ 0.06677912092232112,
82
+ 0.048657150951527554,
83
+ 0.09275336958940797,
84
+ 0.12566984746914736,
85
+ 0.41222738578801793,
86
+ 0.0,
87
+ 0.4330223535305803
88
+ ],
89
+ "max": [
90
+ 0.5862360596656799,
91
+ 0.4034728705883026,
92
+ 0.3568263053894043,
93
+ 1.3517684936523438,
94
+ 1.570796251296997,
95
+ 3.141204357147217,
96
+ 0.0,
97
+ 1.1121242046356201
98
+ ],
99
+ "min": [
100
+ -0.04167502000927925,
101
+ -0.3563207685947418,
102
+ -0.15537554025650024,
103
+ -3.141592502593994,
104
+ -1.4992541074752808,
105
+ -3.14153790473938,
106
+ 0.0,
107
+ 0.04637829214334488
108
+ ],
109
+ "q01": [
110
+ 0.17102622985839844,
111
+ -0.1698118858039379,
112
+ -0.055632163770496845,
113
+ -0.36493172496557236,
114
+ -0.541871190071106,
115
+ -1.354275494813919,
116
+ 0.0,
117
+ 0.052190229296684265
118
+ ],
119
+ "q99": [
120
+ 0.45322076976299286,
121
+ 0.2354845181107521,
122
+ 0.19489620998501778,
123
+ 0.3780156075954437,
124
+ 0.27568644285202026,
125
+ 1.8500566184520721,
126
+ 0.0,
127
+ 1.0105689764022827
128
+ ]
129
+ },
130
+ "num_transitions": 1305714,
131
+ "num_trajectories": 53192
132
+ },
133
+ "oxe_rt1": {
134
+ "action": {
135
+ "mean": [
136
+ 0.003493750700727105,
137
+ 0.003132961690425873,
138
+ -0.0063125672750175,
139
+ 0.02166595682501793,
140
+ -0.0028780836146324873,
141
+ 0.0004565489653032273,
142
+ 0.26771023869514465
143
+ ],
144
+ "std": [
145
+ 0.049065014465362655,
146
+ 0.04229853739828572,
147
+ 0.05237628880142378,
148
+ 0.1124860236500875,
149
+ 0.09312952783816872,
150
+ 0.10319098309601091,
151
+ 0.4418448662622395
152
+ ],
153
+ "max": [
154
+ 2.9984593391418457,
155
+ 22.09052848815918,
156
+ 2.7507524490356445,
157
+ 1.570636510848999,
158
+ 1.5321086645126343,
159
+ 1.5691522359848022,
160
+ 1.0
161
+ ],
162
+ "min": [
163
+ -2.0204520225524902,
164
+ -5.497899532318115,
165
+ -2.031663417816162,
166
+ -1.569917917251587,
167
+ -1.569892168045044,
168
+ -1.570419430732727,
169
+ 0.0
170
+ ],
171
+ "q01": [
172
+ -0.22453527510166169,
173
+ -0.14820013284683228,
174
+ -0.231589707583189,
175
+ -0.3517994859814644,
176
+ -0.4193011274933815,
177
+ -0.43643461108207704,
178
+ 0.0
179
+ ],
180
+ "q99": [
181
+ 0.17824687153100965,
182
+ 0.14938379630446405,
183
+ 0.21842354819178575,
184
+ 0.5892666035890578,
185
+ 0.35272657424211445,
186
+ 0.44796681255102094,
187
+ 1.0
188
+ ],
189
+ "mask": [
190
+ true,
191
+ true,
192
+ true,
193
+ true,
194
+ true,
195
+ true,
196
+ false
197
+ ]
198
+ },
199
+ "state": {
200
+ "mean": [
201
+ 0.2799473702907562,
202
+ -0.04167069122195244,
203
+ 0.38854750990867615,
204
+ 0.21306729316711426,
205
+ -0.12402277439832687,
206
+ 0.24756911396980286,
207
+ 0.046330634504556656,
208
+ 0.10487449914216995
209
+ ],
210
+ "std": [
211
+ 0.29342642876909925,
212
+ 0.09174024655686211,
213
+ 0.42569508885539115,
214
+ 0.38616252611341306,
215
+ 0.38314586427420927,
216
+ 0.44433568806919804,
217
+ 0.1263927443679382,
218
+ 0.22122596673781084
219
+ ],
220
+ "max": [
221
+ 1.0534898042678833,
222
+ 0.48018959164619446,
223
+ 1.6896663904190063,
224
+ 1.0,
225
+ 0.9999993443489075,
226
+ 0.9999874830245972,
227
+ 0.9554369449615479,
228
+ 0.9914546012878418
229
+ ],
230
+ "min": [
231
+ -0.4436439275741577,
232
+ -0.9970501065254211,
233
+ -0.006579156965017319,
234
+ 0.0,
235
+ -0.8643477559089661,
236
+ -0.7079970240592957,
237
+ -0.7688722014427185,
238
+ -0.4999994933605194
239
+ ],
240
+ "q01": [
241
+ 0.32481380939483645,
242
+ -0.28334290891885755,
243
+ 0.14107070609927178,
244
+ 0.0,
245
+ -0.686474204659462,
246
+ -0.6808923494815826,
247
+ -0.36045596331357954,
248
+ -0.454380963742733
249
+ ],
250
+ "q99": [
251
+ 0.8750156319141384,
252
+ 0.21247054174542404,
253
+ 1.0727112340927123,
254
+ 1.0,
255
+ 0.9377871316671368,
256
+ 0.9563051050901409,
257
+ 0.45990042358636823,
258
+ 0.7216041100025177
259
+ ]
260
+ },
261
+ "num_transitions": 3786152,
262
+ "num_trajectories": 87212
263
+ }
264
+ }
qwen3vl_bridge_rt1_QwenOFT_0117_1748/run_qwen3vl_bridge_rt1_qwen_oft.sh ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Framework_name=QwenOFT
2
+ dit_type="DiT-B"
3
+ freeze_module_list='' # fully FT, e.g., freeze_module_list=""
4
+ data_mix=bridge_rt_1
5
+
6
+ ## Modify below paths before running ##
7
+ date_time=$(date +%m%d_%H%M)
8
+ config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
9
+ base_vlm=/home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
10
+ data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
11
+ run_root_dir=./Checkpoints
12
+ run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
13
+ batch_size=8
14
+ wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
15
+ wandb_entity=lookas
16
+
17
+ # export WANDB_MODE=disabled
18
+
19
+ output_dir=${run_root_dir}/${run_id}
20
+ mkdir -p ${output_dir}
21
+ cp $0 ${output_dir}/
22
+
23
+
24
+ accelerate launch --main_process_port 12773 \
25
+ --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
26
+ --num_processes 8 \
27
+ starVLA/training/train_starvla.py \
28
+ --config_yaml ${config_yaml} \
29
+ --framework.name ${Framework_name} \
30
+ --framework.qwenvl.base_vlm ${base_vlm} \
31
+ --datasets.vla_data.data_root_dir ${data_root_dir}\
32
+ --datasets.vla_data.data_mix ${data_mix} \
33
+ --datasets.vla_data.per_device_batch_size ${batch_size} \
34
+ --trainer.freeze_modules ${freeze_module_list} \
35
+ --trainer.max_train_steps 100000 \
36
+ --trainer.save_interval 10000 \
37
+ --trainer.logging_frequency 50 \
38
+ --trainer.eval_interval 200 \
39
+ --run_root_dir ${run_root_dir} \
40
+ --run_id ${run_id} \
41
+ --output_dir ${output_dir} \
42
+ --wandb.project ${wandb_project} \
43
+ --wandb.entity ${wandb_entity}
44
+
45
+
46
+ # multi-node launch example
47
+
48
+ # accelerate launch \
49
+ # --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
50
+ # --main_process_ip $MASTER_ADDR \
51
+ # --main_process_port $MASTER_PORT \
52
+ # --machine_rank $SLURM_PROCID \
53
+ # --num_machines $SLURM_NNODES \
54
+ # --num_processes=${TOTAL_GPUS} \
55
+ # starVLA/training/train_starvla.py \
56
+ # --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
57
+ # --framework.framework_py QwenGR00T \
58
+ # --framework.qwenvl.base_vlm microsoft/Florence-2-large \
59
+ # --run_root_dir ${run_root_dir} \
60
+ # --run_id ${run_id} \
61
+ # --wandb_project your_project \
62
+ # --wandb_entity your_name
qwen3vl_bridge_rt1_QwenOFT_0117_1748/summary.jsonl ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {"steps": 10000}
2
+ {"steps": 20000}
3
+ {"steps": 30000}
4
+ {"steps": 40000}
5
+ {"steps": 50000}
6
+ {"steps": 60000}
7
+ {"steps": 70000}
8
+ {"steps": 80000}
9
+ {"steps": 90000}
10
+ {"steps": 100000}
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug-internal.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-01-17T18:05:32.919256759+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
2
+ {"time":"2026-01-17T18:05:36.622867047+08:00","level":"INFO","msg":"stream: created new stream","id":"rqrn3qyr"}
3
+ {"time":"2026-01-17T18:05:36.623047484+08:00","level":"INFO","msg":"handler: started","stream_id":"rqrn3qyr"}
4
+ {"time":"2026-01-17T18:05:36.648380876+08:00","level":"INFO","msg":"stream: started","id":"rqrn3qyr"}
5
+ {"time":"2026-01-17T18:05:36.64839606+08:00","level":"INFO","msg":"writer: started","stream_id":"rqrn3qyr"}
6
+ {"time":"2026-01-17T18:05:36.648398878+08:00","level":"INFO","msg":"sender: started","stream_id":"rqrn3qyr"}
7
+ {"time":"2026-01-17T22:37:34.86356798+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:52928->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
8
+ {"time":"2026-01-17T22:54:18.423710102+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
9
+ {"time":"2026-01-18T00:12:50.883820737+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
10
+ {"time":"2026-01-18T02:09:32.843274738+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:52904->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
11
+ {"time":"2026-01-18T13:00:31.504000712+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:43174->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
12
+ {"time":"2026-01-18T15:24:38.642505893+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
13
+ {"time":"2026-01-18T19:01:56.523537868+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
14
+ {"time":"2026-01-18T20:33:30.03545379+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
15
+ {"time":"2026-01-18T20:34:13.086658278+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
16
+ {"time":"2026-01-18T21:46:54.335541764+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:53174->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
17
+ {"time":"2026-01-18T21:47:09.229423294+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
18
+ {"time":"2026-01-18T23:52:58.941500301+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
19
+ {"time":"2026-01-19T02:13:36.852336596+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
20
+ {"time":"2026-01-19T02:28:43.986696739+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
21
+ {"time":"2026-01-19T02:28:45.179352006+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
22
+ {"time":"2026-01-19T02:28:45.189009251+08:00","level":"INFO","msg":"stream: closing","id":"rqrn3qyr"}
23
+ {"time":"2026-01-19T02:28:45.189020364+08:00","level":"INFO","msg":"handler: closed","stream_id":"rqrn3qyr"}
24
+ {"time":"2026-01-19T02:28:45.20863216+08:00","level":"INFO","msg":"sender: closed","stream_id":"rqrn3qyr"}
25
+ {"time":"2026-01-19T02:28:45.208650774+08:00","level":"INFO","msg":"stream: closed","id":"rqrn3qyr"}
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug.log ADDED
File without changes
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/config.yaml ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.23.1
4
+ e:
5
+ 5cfcqp03otctf4fyn22usch179j8xvxz:
6
+ args:
7
+ - --config_yaml
8
+ - scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
9
+ - --framework.name
10
+ - QwenOFT
11
+ - --framework.qwenvl.base_vlm
12
+ - /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
13
+ - --datasets.vla_data.data_root_dir
14
+ - ./playground/Datasets/OXE_LEROBOT
15
+ - --datasets.vla_data.data_mix
16
+ - bridge_rt_1
17
+ - --datasets.vla_data.per_device_batch_size
18
+ - "8"
19
+ - --trainer.freeze_modules
20
+ - --trainer.max_train_steps
21
+ - "100000"
22
+ - --trainer.save_interval
23
+ - "10000"
24
+ - --trainer.logging_frequency
25
+ - "50"
26
+ - --trainer.eval_interval
27
+ - "200"
28
+ - --run_root_dir
29
+ - ./Checkpoints
30
+ - --run_id
31
+ - qwen3vl_bridge_rt1_QwenOFT_0117_1748
32
+ - --output_dir
33
+ - ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0117_1748
34
+ - --wandb.project
35
+ - Qwen3VL_Bridge_RT1_QwenOFT
36
+ - --wandb.entity
37
+ - lookas
38
+ codePath: starVLA/training/train_starvla.py
39
+ codePathLocal: starVLA/training/train_starvla.py
40
+ cpu_count: 90
41
+ cpu_count_logical: 180
42
+ cudaVersion: "12.4"
43
+ disk:
44
+ /:
45
+ total: "3779301580800"
46
+ used: "151636508672"
47
+ email: hilookas@gmail.com
48
+ executable: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3
49
+ git:
50
+ commit: ab531aff5b27795879c61f67892330a616e9dbf0
51
+ remote: https://github.com/hilookas/starVLA_pickxiguapi
52
+ gpu: NVIDIA H20
53
+ gpu_count: 8
54
+ gpu_nvidia:
55
+ - architecture: Hopper
56
+ cudaCores: 9984
57
+ memoryTotal: "102625181696"
58
+ name: NVIDIA H20
59
+ uuid: GPU-fb4370de-60ba-70ca-eeca-022c40ee5dc2
60
+ - architecture: Hopper
61
+ cudaCores: 9984
62
+ memoryTotal: "102625181696"
63
+ name: NVIDIA H20
64
+ uuid: GPU-2b87ce45-0783-3787-00a5-678fab82dff7
65
+ - architecture: Hopper
66
+ cudaCores: 9984
67
+ memoryTotal: "102625181696"
68
+ name: NVIDIA H20
69
+ uuid: GPU-f37740ca-0c96-508b-6014-0c7c5717ce90
70
+ - architecture: Hopper
71
+ cudaCores: 9984
72
+ memoryTotal: "102625181696"
73
+ name: NVIDIA H20
74
+ uuid: GPU-f59773d6-f9c1-34dc-06fa-92979c9f3c64
75
+ - architecture: Hopper
76
+ cudaCores: 9984
77
+ memoryTotal: "102625181696"
78
+ name: NVIDIA H20
79
+ uuid: GPU-993ec1cf-6953-aff2-fd04-2f116a004be8
80
+ - architecture: Hopper
81
+ cudaCores: 9984
82
+ memoryTotal: "102625181696"
83
+ name: NVIDIA H20
84
+ uuid: GPU-c1ddbd85-e0d5-97e8-cc7e-3bb01759b504
85
+ - architecture: Hopper
86
+ cudaCores: 9984
87
+ memoryTotal: "102625181696"
88
+ name: NVIDIA H20
89
+ uuid: GPU-e8bab208-8550-dbd6-9630-08f32d2f4fce
90
+ - architecture: Hopper
91
+ cudaCores: 9984
92
+ memoryTotal: "102625181696"
93
+ name: NVIDIA H20
94
+ uuid: GPU-8be9c3c0-cd15-3534-0dbd-de2c1d6aaf1d
95
+ host: g340-cd51-7700-4fb-cd4a-6d4e-969e
96
+ memory:
97
+ total: "2071188119552"
98
+ os: Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36
99
+ program: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py
100
+ python: CPython 3.10.19
101
+ root: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb
102
+ startedAt: "2026-01-17T10:05:26.699051Z"
103
+ writerId: 5cfcqp03otctf4fyn22usch179j8xvxz
104
+ m: []
105
+ python_version: 3.10.19
106
+ t:
107
+ "1":
108
+ - 1
109
+ - 11
110
+ - 41
111
+ - 49
112
+ - 63
113
+ - 71
114
+ - 80
115
+ - 83
116
+ "2":
117
+ - 1
118
+ - 11
119
+ - 41
120
+ - 49
121
+ - 63
122
+ - 71
123
+ - 80
124
+ - 83
125
+ "3":
126
+ - 2
127
+ - 13
128
+ - 61
129
+ "4": 3.10.19
130
+ "5": 0.23.1
131
+ "6": 4.57.3
132
+ "12": 0.23.1
133
+ "13": linux-x86_64
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/output.log ADDED
The diff for this file is too large to render. See raw diff