Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +4 -0
- .gitignore +1 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/config.yaml +71 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/dataset_statistics.json +264 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/run_qwen3vl_bridge_rt1_qwen_gr00t.sh +62 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/summary.jsonl +4 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug-internal.log +18 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/output.log +0 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/requirements.txt +190 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/wandb-metadata.json +122 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug-internal.log +18 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/run-xgfaxrjd.wandb +3 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/config.yaml +71 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/dataset_statistics.json +264 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/run_qwen3vl_bridge_rt1_qwen_gr00t.sh +62 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/summary.jsonl +10 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug-internal.log +89 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/config.yaml +133 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/output.log +0 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/requirements.txt +190 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-metadata.json +122 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-summary.json +1 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug-internal.log +89 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/run-xbap43rk.wandb +3 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/config.yaml +51 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/dataset_statistics.json +264 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/run_qwen3vl_bridge_rt1_qwen_oft.sh +62 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/summary.jsonl +10 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug-internal.log +78 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/config.yaml +133 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/output.log +0 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/requirements.txt +190 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-metadata.json +122 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-summary.json +1 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug-internal.log +78 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/run-ueywjhk5.wandb +3 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/config.yaml +51 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/dataset_statistics.json +264 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/run_qwen3vl_bridge_rt1_qwen_oft.sh +62 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/summary.jsonl +10 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug-internal.log +25 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug.log +0 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/config.yaml +133 -0
- qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/output.log +0 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/run-xgfaxrjd.wandb filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/run-xbap43rk.wandb filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/run-ueywjhk5.wandb filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/run-rqrn3qyr.wandb filter=lfs diff=lfs merge=lfs -text
|
.gitignore
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
wandb
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/config.yaml
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
datasets:
|
| 2 |
+
vla_data:
|
| 3 |
+
CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
|
| 4 |
+
Locate their bounding boxes in [x1,y1,x2,y2] format.
|
| 5 |
+
data_mix: bridge_rt_1
|
| 6 |
+
data_root_dir: ./playground/Datasets/OXE_LEROBOT
|
| 7 |
+
dataset_py: lerobot_datasets
|
| 8 |
+
image_size:
|
| 9 |
+
- 224
|
| 10 |
+
- 224
|
| 11 |
+
per_device_batch_size: 8
|
| 12 |
+
video_backend: torchvision_av
|
| 13 |
+
framework:
|
| 14 |
+
action_model:
|
| 15 |
+
action_dim: 7
|
| 16 |
+
action_horizon: 16
|
| 17 |
+
action_model_type: DiT-B
|
| 18 |
+
add_pos_embed: true
|
| 19 |
+
diffusion_model_cfg:
|
| 20 |
+
cross_attention_dim: 4096
|
| 21 |
+
dropout: 0.2
|
| 22 |
+
final_dropout: true
|
| 23 |
+
interleave_self_attention: true
|
| 24 |
+
norm_type: ada_norm
|
| 25 |
+
num_layers: 16
|
| 26 |
+
output_dim: 1024
|
| 27 |
+
positional_embeddings: null
|
| 28 |
+
future_action_window_size: 15
|
| 29 |
+
hidden_size: 1024
|
| 30 |
+
max_seq_len: 1024
|
| 31 |
+
noise_beta_alpha: 1.5
|
| 32 |
+
noise_beta_beta: 1.0
|
| 33 |
+
noise_s: 0.999
|
| 34 |
+
num_inference_timesteps: 4
|
| 35 |
+
num_target_vision_tokens: 32
|
| 36 |
+
num_timestep_buckets: 1000
|
| 37 |
+
past_action_window_size: 0
|
| 38 |
+
state_dim: 7
|
| 39 |
+
name: QwenGR00T
|
| 40 |
+
qwenvl:
|
| 41 |
+
base_vlm: /home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
|
| 42 |
+
output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0112_1323
|
| 43 |
+
run_id: qwen3vl_bridge_rt1_QwenGR00T_0112_1323
|
| 44 |
+
run_root_dir: ./Checkpoints
|
| 45 |
+
seed: 42
|
| 46 |
+
trainer:
|
| 47 |
+
eval_interval: 200
|
| 48 |
+
freeze_modules: true
|
| 49 |
+
gradient_accumulation_steps: 1
|
| 50 |
+
gradient_clipping: 1.0
|
| 51 |
+
is_resume: false
|
| 52 |
+
learning_rate:
|
| 53 |
+
action_model: 0.0001
|
| 54 |
+
base: 1.0e-05
|
| 55 |
+
qwen_vl_interface: 1.0e-05
|
| 56 |
+
logging_frequency: 50
|
| 57 |
+
lr_scheduler_type: cosine_with_min_lr
|
| 58 |
+
max_train_steps: 100000
|
| 59 |
+
num_warmup_steps: 10000
|
| 60 |
+
optimizer:
|
| 61 |
+
betas:
|
| 62 |
+
- 0.9
|
| 63 |
+
- 0.95
|
| 64 |
+
eps: 1.0e-08
|
| 65 |
+
weight_decay: 1.0e-08
|
| 66 |
+
repeated_diffusion_steps: 4
|
| 67 |
+
save_interval: 10000
|
| 68 |
+
scheduler_specific_kwargs:
|
| 69 |
+
min_lr: 5.0e-07
|
| 70 |
+
wandb_entity: lookas
|
| 71 |
+
wandb_project: Qwen3VL_Bridge_RT1_GR00T
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/dataset_statistics.json
ADDED
|
@@ -0,0 +1,264 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"oxe_bridge": {
|
| 3 |
+
"action": {
|
| 4 |
+
"mean": [
|
| 5 |
+
0.00011365935642970726,
|
| 6 |
+
6.556110747624189e-05,
|
| 7 |
+
-6.320965621853247e-05,
|
| 8 |
+
-7.205353176686913e-05,
|
| 9 |
+
-0.00019515302847139537,
|
| 10 |
+
0.0001203166029881686,
|
| 11 |
+
0.28829458355903625
|
| 12 |
+
],
|
| 13 |
+
"std": [
|
| 14 |
+
0.006909770731857718,
|
| 15 |
+
0.009684093232852218,
|
| 16 |
+
0.00896290498528129,
|
| 17 |
+
0.020121052930683073,
|
| 18 |
+
0.021582655517295487,
|
| 19 |
+
0.054723342223346974,
|
| 20 |
+
0.4543627821514982
|
| 21 |
+
],
|
| 22 |
+
"max": [
|
| 23 |
+
0.41691166162490845,
|
| 24 |
+
0.25864794850349426,
|
| 25 |
+
0.21218234300613403,
|
| 26 |
+
3.122201919555664,
|
| 27 |
+
1.8618112802505493,
|
| 28 |
+
6.272472858428955,
|
| 29 |
+
1.0
|
| 30 |
+
],
|
| 31 |
+
"min": [
|
| 32 |
+
-0.4007510244846344,
|
| 33 |
+
-0.13874775171279907,
|
| 34 |
+
-0.22553899884223938,
|
| 35 |
+
-3.2010786533355713,
|
| 36 |
+
-1.8618112802505493,
|
| 37 |
+
-6.279075622558594,
|
| 38 |
+
0.0
|
| 39 |
+
],
|
| 40 |
+
"q01": [
|
| 41 |
+
-0.02875255048274994,
|
| 42 |
+
-0.04170213546603918,
|
| 43 |
+
-0.026096721179783344,
|
| 44 |
+
-0.08052874729037285,
|
| 45 |
+
-0.09249906800687313,
|
| 46 |
+
-0.20738555490970612,
|
| 47 |
+
0.0
|
| 48 |
+
],
|
| 49 |
+
"q99": [
|
| 50 |
+
0.028306663036346436,
|
| 51 |
+
0.04089853074401617,
|
| 52 |
+
0.0401805154979229,
|
| 53 |
+
0.08173403143882751,
|
| 54 |
+
0.07760760560631752,
|
| 55 |
+
0.2038465365767479,
|
| 56 |
+
1.0
|
| 57 |
+
],
|
| 58 |
+
"mask": [
|
| 59 |
+
true,
|
| 60 |
+
true,
|
| 61 |
+
true,
|
| 62 |
+
true,
|
| 63 |
+
true,
|
| 64 |
+
true,
|
| 65 |
+
false
|
| 66 |
+
]
|
| 67 |
+
},
|
| 68 |
+
"state": {
|
| 69 |
+
"mean": [
|
| 70 |
+
0.15471743047237396,
|
| 71 |
+
0.015362550504505634,
|
| 72 |
+
0.03222028166055679,
|
| 73 |
+
0.0032453201711177826,
|
| 74 |
+
-0.038600146770477295,
|
| 75 |
+
0.05382946878671646,
|
| 76 |
+
0.0,
|
| 77 |
+
0.35406652092933655
|
| 78 |
+
],
|
| 79 |
+
"std": [
|
| 80 |
+
0.1605359274864927,
|
| 81 |
+
0.06677912092232112,
|
| 82 |
+
0.048657150951527554,
|
| 83 |
+
0.09275336958940797,
|
| 84 |
+
0.12566984746914736,
|
| 85 |
+
0.41222738578801793,
|
| 86 |
+
0.0,
|
| 87 |
+
0.4330223535305803
|
| 88 |
+
],
|
| 89 |
+
"max": [
|
| 90 |
+
0.5862360596656799,
|
| 91 |
+
0.4034728705883026,
|
| 92 |
+
0.3568263053894043,
|
| 93 |
+
1.3517684936523438,
|
| 94 |
+
1.570796251296997,
|
| 95 |
+
3.141204357147217,
|
| 96 |
+
0.0,
|
| 97 |
+
1.1121242046356201
|
| 98 |
+
],
|
| 99 |
+
"min": [
|
| 100 |
+
-0.04167502000927925,
|
| 101 |
+
-0.3563207685947418,
|
| 102 |
+
-0.15537554025650024,
|
| 103 |
+
-3.141592502593994,
|
| 104 |
+
-1.4992541074752808,
|
| 105 |
+
-3.14153790473938,
|
| 106 |
+
0.0,
|
| 107 |
+
0.04637829214334488
|
| 108 |
+
],
|
| 109 |
+
"q01": [
|
| 110 |
+
0.17102622985839844,
|
| 111 |
+
-0.1698118858039379,
|
| 112 |
+
-0.055632163770496845,
|
| 113 |
+
-0.36493172496557236,
|
| 114 |
+
-0.541871190071106,
|
| 115 |
+
-1.354275494813919,
|
| 116 |
+
0.0,
|
| 117 |
+
0.052190229296684265
|
| 118 |
+
],
|
| 119 |
+
"q99": [
|
| 120 |
+
0.45322076976299286,
|
| 121 |
+
0.2354845181107521,
|
| 122 |
+
0.19489620998501778,
|
| 123 |
+
0.3780156075954437,
|
| 124 |
+
0.27568644285202026,
|
| 125 |
+
1.8500566184520721,
|
| 126 |
+
0.0,
|
| 127 |
+
1.0105689764022827
|
| 128 |
+
]
|
| 129 |
+
},
|
| 130 |
+
"num_transitions": 1305714,
|
| 131 |
+
"num_trajectories": 53192
|
| 132 |
+
},
|
| 133 |
+
"oxe_rt1": {
|
| 134 |
+
"action": {
|
| 135 |
+
"mean": [
|
| 136 |
+
0.003493750700727105,
|
| 137 |
+
0.003132961690425873,
|
| 138 |
+
-0.0063125672750175,
|
| 139 |
+
0.02166595682501793,
|
| 140 |
+
-0.0028780836146324873,
|
| 141 |
+
0.0004565489653032273,
|
| 142 |
+
0.26771023869514465
|
| 143 |
+
],
|
| 144 |
+
"std": [
|
| 145 |
+
0.049065014465362655,
|
| 146 |
+
0.04229853739828572,
|
| 147 |
+
0.05237628880142378,
|
| 148 |
+
0.1124860236500875,
|
| 149 |
+
0.09312952783816872,
|
| 150 |
+
0.10319098309601091,
|
| 151 |
+
0.4418448662622395
|
| 152 |
+
],
|
| 153 |
+
"max": [
|
| 154 |
+
2.9984593391418457,
|
| 155 |
+
22.09052848815918,
|
| 156 |
+
2.7507524490356445,
|
| 157 |
+
1.570636510848999,
|
| 158 |
+
1.5321086645126343,
|
| 159 |
+
1.5691522359848022,
|
| 160 |
+
1.0
|
| 161 |
+
],
|
| 162 |
+
"min": [
|
| 163 |
+
-2.0204520225524902,
|
| 164 |
+
-5.497899532318115,
|
| 165 |
+
-2.031663417816162,
|
| 166 |
+
-1.569917917251587,
|
| 167 |
+
-1.569892168045044,
|
| 168 |
+
-1.570419430732727,
|
| 169 |
+
0.0
|
| 170 |
+
],
|
| 171 |
+
"q01": [
|
| 172 |
+
-0.22453527510166169,
|
| 173 |
+
-0.14820013284683228,
|
| 174 |
+
-0.231589707583189,
|
| 175 |
+
-0.3517994859814644,
|
| 176 |
+
-0.4193011274933815,
|
| 177 |
+
-0.43643461108207704,
|
| 178 |
+
0.0
|
| 179 |
+
],
|
| 180 |
+
"q99": [
|
| 181 |
+
0.17824687153100965,
|
| 182 |
+
0.14938379630446405,
|
| 183 |
+
0.21842354819178575,
|
| 184 |
+
0.5892666035890578,
|
| 185 |
+
0.35272657424211445,
|
| 186 |
+
0.44796681255102094,
|
| 187 |
+
1.0
|
| 188 |
+
],
|
| 189 |
+
"mask": [
|
| 190 |
+
true,
|
| 191 |
+
true,
|
| 192 |
+
true,
|
| 193 |
+
true,
|
| 194 |
+
true,
|
| 195 |
+
true,
|
| 196 |
+
false
|
| 197 |
+
]
|
| 198 |
+
},
|
| 199 |
+
"state": {
|
| 200 |
+
"mean": [
|
| 201 |
+
0.2799473702907562,
|
| 202 |
+
-0.04167069122195244,
|
| 203 |
+
0.38854750990867615,
|
| 204 |
+
0.21306729316711426,
|
| 205 |
+
-0.12402277439832687,
|
| 206 |
+
0.24756911396980286,
|
| 207 |
+
0.046330634504556656,
|
| 208 |
+
0.10487449914216995
|
| 209 |
+
],
|
| 210 |
+
"std": [
|
| 211 |
+
0.29342642876909925,
|
| 212 |
+
0.09174024655686211,
|
| 213 |
+
0.42569508885539115,
|
| 214 |
+
0.38616252611341306,
|
| 215 |
+
0.38314586427420927,
|
| 216 |
+
0.44433568806919804,
|
| 217 |
+
0.1263927443679382,
|
| 218 |
+
0.22122596673781084
|
| 219 |
+
],
|
| 220 |
+
"max": [
|
| 221 |
+
1.0534898042678833,
|
| 222 |
+
0.48018959164619446,
|
| 223 |
+
1.6896663904190063,
|
| 224 |
+
1.0,
|
| 225 |
+
0.9999993443489075,
|
| 226 |
+
0.9999874830245972,
|
| 227 |
+
0.9554369449615479,
|
| 228 |
+
0.9914546012878418
|
| 229 |
+
],
|
| 230 |
+
"min": [
|
| 231 |
+
-0.4436439275741577,
|
| 232 |
+
-0.9970501065254211,
|
| 233 |
+
-0.006579156965017319,
|
| 234 |
+
0.0,
|
| 235 |
+
-0.8643477559089661,
|
| 236 |
+
-0.7079970240592957,
|
| 237 |
+
-0.7688722014427185,
|
| 238 |
+
-0.4999994933605194
|
| 239 |
+
],
|
| 240 |
+
"q01": [
|
| 241 |
+
0.32481380939483645,
|
| 242 |
+
-0.28334290891885755,
|
| 243 |
+
0.14107070609927178,
|
| 244 |
+
0.0,
|
| 245 |
+
-0.686474204659462,
|
| 246 |
+
-0.6808923494815826,
|
| 247 |
+
-0.36045596331357954,
|
| 248 |
+
-0.454380963742733
|
| 249 |
+
],
|
| 250 |
+
"q99": [
|
| 251 |
+
0.8750156319141384,
|
| 252 |
+
0.21247054174542404,
|
| 253 |
+
1.0727112340927123,
|
| 254 |
+
1.0,
|
| 255 |
+
0.9377871316671368,
|
| 256 |
+
0.9563051050901409,
|
| 257 |
+
0.45990042358636823,
|
| 258 |
+
0.7216041100025177
|
| 259 |
+
]
|
| 260 |
+
},
|
| 261 |
+
"num_transitions": 3786152,
|
| 262 |
+
"num_trajectories": 87212
|
| 263 |
+
}
|
| 264 |
+
}
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/run_qwen3vl_bridge_rt1_qwen_gr00t.sh
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Framework_name=QwenGR00T
|
| 2 |
+
dit_type="DiT-B"
|
| 3 |
+
freeze_module_list='' # fully FT, e.g., freeze_module_list=""
|
| 4 |
+
data_mix=bridge_rt_1
|
| 5 |
+
|
| 6 |
+
## Modify below paths before running ##
|
| 7 |
+
date_time=$(date +%m%d_%H%M)
|
| 8 |
+
config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml
|
| 9 |
+
base_vlm=/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
|
| 10 |
+
data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
|
| 11 |
+
run_root_dir=./Checkpoints
|
| 12 |
+
run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
|
| 13 |
+
batch_size=8
|
| 14 |
+
wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
|
| 15 |
+
wandb_entity=lookas
|
| 16 |
+
|
| 17 |
+
# export WANDB_MODE=disabled
|
| 18 |
+
|
| 19 |
+
output_dir=${run_root_dir}/${run_id}
|
| 20 |
+
mkdir -p ${output_dir}
|
| 21 |
+
cp $0 ${output_dir}/
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
accelerate launch --main_process_port 12773 \
|
| 25 |
+
--config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 26 |
+
--num_processes 8 \
|
| 27 |
+
starVLA/training/train_starvla.py \
|
| 28 |
+
--config_yaml ${config_yaml} \
|
| 29 |
+
--framework.name ${Framework_name} \
|
| 30 |
+
--framework.qwenvl.base_vlm ${base_vlm} \
|
| 31 |
+
--datasets.vla_data.data_root_dir ${data_root_dir}\
|
| 32 |
+
--datasets.vla_data.data_mix ${data_mix} \
|
| 33 |
+
--datasets.vla_data.per_device_batch_size ${batch_size} \
|
| 34 |
+
--trainer.freeze_modules ${freeze_module_list} \
|
| 35 |
+
--trainer.max_train_steps 100000 \
|
| 36 |
+
--trainer.save_interval 10000 \
|
| 37 |
+
--trainer.logging_frequency 50 \
|
| 38 |
+
--trainer.eval_interval 200 \
|
| 39 |
+
--run_root_dir ${run_root_dir} \
|
| 40 |
+
--run_id ${run_id} \
|
| 41 |
+
--output_dir ${output_dir} \
|
| 42 |
+
--wandb.project ${wandb_project} \
|
| 43 |
+
--wandb.entity ${wandb_entity}
|
| 44 |
+
|
| 45 |
+
|
| 46 |
+
# multi-node launch example
|
| 47 |
+
|
| 48 |
+
# accelerate launch \
|
| 49 |
+
# --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 50 |
+
# --main_process_ip $MASTER_ADDR \
|
| 51 |
+
# --main_process_port $MASTER_PORT \
|
| 52 |
+
# --machine_rank $SLURM_PROCID \
|
| 53 |
+
# --num_machines $SLURM_NNODES \
|
| 54 |
+
# --num_processes=${TOTAL_GPUS} \
|
| 55 |
+
# starVLA/training/train_starvla.py \
|
| 56 |
+
# --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
|
| 57 |
+
# --framework.framework_py QwenGR00T \
|
| 58 |
+
# --framework.qwenvl.base_vlm microsoft/Florence-2-large \
|
| 59 |
+
# --run_root_dir ${run_root_dir} \
|
| 60 |
+
# --run_id ${run_id} \
|
| 61 |
+
# --wandb_project your_project \
|
| 62 |
+
# --wandb_entity your_name
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/summary.jsonl
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"steps": 10000}
|
| 2 |
+
{"steps": 20000}
|
| 3 |
+
{"steps": 30000}
|
| 4 |
+
{"steps": 40000}
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug-internal.log
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-12T13:32:42.27765521+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-12T13:32:45.284673898+08:00","level":"INFO","msg":"stream: created new stream","id":"xgfaxrjd"}
|
| 3 |
+
{"time":"2026-01-12T13:32:45.284920554+08:00","level":"INFO","msg":"handler: started","stream_id":"xgfaxrjd"}
|
| 4 |
+
{"time":"2026-01-12T13:32:45.310206106+08:00","level":"INFO","msg":"stream: started","id":"xgfaxrjd"}
|
| 5 |
+
{"time":"2026-01-12T13:32:45.310216651+08:00","level":"INFO","msg":"writer: started","stream_id":"xgfaxrjd"}
|
| 6 |
+
{"time":"2026-01-12T13:32:45.310224054+08:00","level":"INFO","msg":"sender: started","stream_id":"xgfaxrjd"}
|
| 7 |
+
{"time":"2026-01-12T14:18:28.350417757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 8 |
+
{"time":"2026-01-12T14:38:43.346919104+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 9 |
+
{"time":"2026-01-12T15:18:31.304717808+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded"}
|
| 10 |
+
{"time":"2026-01-12T15:52:59.271728136+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
|
| 11 |
+
{"time":"2026-01-12T18:50:56.901819762+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 12 |
+
{"time":"2026-01-12T18:51:26.812243249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 13 |
+
{"time":"2026-01-12T22:30:01.306180525+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 14 |
+
{"time":"2026-01-12T22:41:55.253842283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-13T03:06:46.307270176+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 16 |
+
{"time":"2026-01-13T03:12:11.798876383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 17 |
+
{"time":"2026-01-13T03:13:26.908899958+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 18 |
+
{"time":"2026-01-13T05:34:26.902207579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/output.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/requirements.txt
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
starVLA==1.0.1
|
| 2 |
+
absl-py==2.3.1
|
| 3 |
+
accelerate==1.5.2
|
| 4 |
+
albucore==0.0.17
|
| 5 |
+
albumentations==1.4.18
|
| 6 |
+
annotated-types==0.7.0
|
| 7 |
+
antlr4-python3-runtime==4.9.3
|
| 8 |
+
anyio==4.12.0
|
| 9 |
+
asttokens==3.0.1
|
| 10 |
+
attrs==20.3.0
|
| 11 |
+
av==12.3.0
|
| 12 |
+
bddl==1.0.1
|
| 13 |
+
certifi==2025.11.12
|
| 14 |
+
charset-normalizer==3.4.4
|
| 15 |
+
click==8.3.1
|
| 16 |
+
cloudpickle==3.1.2
|
| 17 |
+
contourpy==1.3.2
|
| 18 |
+
cramjam==2.11.0
|
| 19 |
+
cycler==0.12.1
|
| 20 |
+
debugpy==1.8.19
|
| 21 |
+
decorator==5.2.1
|
| 22 |
+
decord==0.6.0
|
| 23 |
+
deepspeed==0.16.9
|
| 24 |
+
diffusers==0.36.0
|
| 25 |
+
docstring_parser==0.17.0
|
| 26 |
+
easydict==1.9
|
| 27 |
+
einops==0.8.1
|
| 28 |
+
etils==1.13.0
|
| 29 |
+
eva-decord==0.6.1
|
| 30 |
+
eval_type_backport==0.3.1
|
| 31 |
+
exceptiongroup==1.3.1
|
| 32 |
+
executing==2.2.1
|
| 33 |
+
fastjsonschema==2.21.2
|
| 34 |
+
fastparquet==2024.11.0
|
| 35 |
+
filelock==3.20.2
|
| 36 |
+
flash_attn==2.8.3
|
| 37 |
+
fonttools==4.61.1
|
| 38 |
+
fsspec==2025.12.0
|
| 39 |
+
future==0.18.2
|
| 40 |
+
fvcore==0.1.5.post20221221
|
| 41 |
+
gevent==25.9.1
|
| 42 |
+
gitdb==4.0.12
|
| 43 |
+
GitPython==3.1.46
|
| 44 |
+
glfw==2.10.0
|
| 45 |
+
greenlet==3.3.0
|
| 46 |
+
grpcio==1.76.0
|
| 47 |
+
gym==0.26.2
|
| 48 |
+
gym-notices==0.1.0
|
| 49 |
+
h11==0.16.0
|
| 50 |
+
hf-xet==1.2.0
|
| 51 |
+
hjson==3.1.0
|
| 52 |
+
httpcore==1.0.9
|
| 53 |
+
httpx==0.28.1
|
| 54 |
+
huggingface-hub==0.36.0
|
| 55 |
+
idna==3.11
|
| 56 |
+
ImageIO==2.37.2
|
| 57 |
+
importlib_metadata==8.7.1
|
| 58 |
+
importlib_resources==6.5.2
|
| 59 |
+
iniconfig==2.3.0
|
| 60 |
+
iopath==0.1.10
|
| 61 |
+
ipdb==0.13.13
|
| 62 |
+
ipython==8.37.0
|
| 63 |
+
jedi==0.19.2
|
| 64 |
+
Jinja2==3.1.6
|
| 65 |
+
jsonschema==4.17.3
|
| 66 |
+
jupyter_core==5.9.1
|
| 67 |
+
jupytext==1.18.1
|
| 68 |
+
kiwisolver==1.4.9
|
| 69 |
+
lazy_loader==0.4
|
| 70 |
+
libero==0.1.0
|
| 71 |
+
llvmlite==0.46.0
|
| 72 |
+
Markdown==3.10
|
| 73 |
+
markdown-it-py==4.0.0
|
| 74 |
+
MarkupSafe==3.0.3
|
| 75 |
+
matplotlib==3.10.8
|
| 76 |
+
matplotlib-inline==0.2.1
|
| 77 |
+
mdit-py-plugins==0.5.0
|
| 78 |
+
mdurl==0.1.2
|
| 79 |
+
mpmath==1.3.0
|
| 80 |
+
msgpack==1.1.2
|
| 81 |
+
mujoco==3.4.0
|
| 82 |
+
nbformat==5.10.4
|
| 83 |
+
networkx==3.4.2
|
| 84 |
+
ninja==1.13.0
|
| 85 |
+
numba==0.63.1
|
| 86 |
+
numpy==1.26.4
|
| 87 |
+
numpydantic==1.6.9
|
| 88 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 89 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 90 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 91 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 92 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 93 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 94 |
+
nvidia-curand-cu12==10.3.5.147
|
| 95 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 96 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 97 |
+
nvidia-nccl-cu12==2.21.5
|
| 98 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 99 |
+
nvidia-nvtx-cu12==12.4.127
|
| 100 |
+
omegaconf==2.3.0
|
| 101 |
+
opencv-python==4.11.0.86
|
| 102 |
+
opencv-python-headless==4.11.0.86
|
| 103 |
+
packaging==25.0
|
| 104 |
+
pandas==2.3.3
|
| 105 |
+
parso==0.8.5
|
| 106 |
+
pexpect==4.9.0
|
| 107 |
+
pillow==12.1.0
|
| 108 |
+
pipablepytorch3d==0.7.6
|
| 109 |
+
platformdirs==4.5.1
|
| 110 |
+
pluggy==1.6.0
|
| 111 |
+
portalocker==3.2.0
|
| 112 |
+
prompt_toolkit==3.0.52
|
| 113 |
+
protobuf==6.33.2
|
| 114 |
+
psutil==7.2.1
|
| 115 |
+
ptyprocess==0.7.0
|
| 116 |
+
pure_eval==0.2.3
|
| 117 |
+
py-cpuinfo==9.0.0
|
| 118 |
+
pyarrow==14.0.1
|
| 119 |
+
pydantic==2.10.6
|
| 120 |
+
pydantic_core==2.27.2
|
| 121 |
+
Pygments==2.19.2
|
| 122 |
+
PyOpenGL==3.1.10
|
| 123 |
+
pyparsing==3.3.1
|
| 124 |
+
pyrsistent==0.20.0
|
| 125 |
+
pytest==9.0.2
|
| 126 |
+
python-dateutil==2.9.0.post0
|
| 127 |
+
pytz==2025.2
|
| 128 |
+
PyYAML==6.0.3
|
| 129 |
+
qwen-vl-utils==0.0.14
|
| 130 |
+
regex==2025.11.3
|
| 131 |
+
requests==2.32.5
|
| 132 |
+
rich==14.2.0
|
| 133 |
+
robosuite==1.4.0
|
| 134 |
+
safetensors==0.7.0
|
| 135 |
+
scikit-image==0.25.2
|
| 136 |
+
scipy==1.15.3
|
| 137 |
+
sentry-sdk==2.48.0
|
| 138 |
+
setuptools==80.9.0
|
| 139 |
+
six==1.17.0
|
| 140 |
+
smmap==5.0.2
|
| 141 |
+
stack-data==0.6.3
|
| 142 |
+
starVLA==1.0.1
|
| 143 |
+
sympy==1.13.1
|
| 144 |
+
tabulate==0.9.0
|
| 145 |
+
tensorboard==2.20.0
|
| 146 |
+
tensorboard-data-server==0.7.2
|
| 147 |
+
termcolor==3.3.0
|
| 148 |
+
tifffile==2025.5.10
|
| 149 |
+
tiktoken==0.12.0
|
| 150 |
+
timm==1.0.22
|
| 151 |
+
tokenizers==0.22.1
|
| 152 |
+
tomli==2.3.0
|
| 153 |
+
torch==2.5.1
|
| 154 |
+
torchvision==0.20.1
|
| 155 |
+
tqdm==4.67.1
|
| 156 |
+
traitlets==5.14.3
|
| 157 |
+
transformers==4.57.3
|
| 158 |
+
transformers-stream-generator==0.0.4
|
| 159 |
+
triton==3.1.0
|
| 160 |
+
typeguard==4.4.4
|
| 161 |
+
typing_extensions==4.15.0
|
| 162 |
+
tyro==1.0.3
|
| 163 |
+
tzdata==2025.3
|
| 164 |
+
urllib3==2.6.2
|
| 165 |
+
wandb==0.23.1
|
| 166 |
+
wcwidth==0.2.14
|
| 167 |
+
websocket==0.2.1
|
| 168 |
+
websocket-client==1.8.0
|
| 169 |
+
websockets==15.0.1
|
| 170 |
+
Werkzeug==3.1.4
|
| 171 |
+
yacs==0.1.8
|
| 172 |
+
zipp==3.23.0
|
| 173 |
+
zope.event==6.1
|
| 174 |
+
zope.interface==8.1.1
|
| 175 |
+
autocommand==2.2.2
|
| 176 |
+
backports.tarfile==1.2.0
|
| 177 |
+
importlib_metadata==8.0.0
|
| 178 |
+
inflect==7.3.1
|
| 179 |
+
jaraco.collections==5.1.0
|
| 180 |
+
jaraco.context==5.3.0
|
| 181 |
+
jaraco.functools==4.0.1
|
| 182 |
+
jaraco.text==3.12.1
|
| 183 |
+
more-itertools==10.3.0
|
| 184 |
+
packaging==24.2
|
| 185 |
+
platformdirs==4.2.2
|
| 186 |
+
tomli==2.0.1
|
| 187 |
+
typeguard==4.3.0
|
| 188 |
+
typing_extensions==4.12.2
|
| 189 |
+
wheel==0.45.1
|
| 190 |
+
zipp==3.19.2
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,122 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36",
|
| 3 |
+
"python": "CPython 3.10.19",
|
| 4 |
+
"startedAt": "2026-01-12T05:32:35.945274Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--config_yaml",
|
| 7 |
+
"scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml",
|
| 8 |
+
"--framework.name",
|
| 9 |
+
"QwenGR00T",
|
| 10 |
+
"--framework.qwenvl.base_vlm",
|
| 11 |
+
"/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b",
|
| 12 |
+
"--datasets.vla_data.data_root_dir",
|
| 13 |
+
"./playground/Datasets/OXE_LEROBOT",
|
| 14 |
+
"--datasets.vla_data.data_mix",
|
| 15 |
+
"bridge_rt_1",
|
| 16 |
+
"--datasets.vla_data.per_device_batch_size",
|
| 17 |
+
"8",
|
| 18 |
+
"--trainer.freeze_modules",
|
| 19 |
+
"--trainer.max_train_steps",
|
| 20 |
+
"100000",
|
| 21 |
+
"--trainer.save_interval",
|
| 22 |
+
"10000",
|
| 23 |
+
"--trainer.logging_frequency",
|
| 24 |
+
"50",
|
| 25 |
+
"--trainer.eval_interval",
|
| 26 |
+
"200",
|
| 27 |
+
"--run_root_dir",
|
| 28 |
+
"./Checkpoints",
|
| 29 |
+
"--run_id",
|
| 30 |
+
"qwen3vl_bridge_rt1_QwenGR00T_0112_1323",
|
| 31 |
+
"--output_dir",
|
| 32 |
+
"./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0112_1323",
|
| 33 |
+
"--wandb.project",
|
| 34 |
+
"Qwen3VL_Bridge_RT1_QwenGR00T",
|
| 35 |
+
"--wandb.entity",
|
| 36 |
+
"lookas"
|
| 37 |
+
],
|
| 38 |
+
"program": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py",
|
| 39 |
+
"codePath": "starVLA/training/train_starvla.py",
|
| 40 |
+
"codePathLocal": "starVLA/training/train_starvla.py",
|
| 41 |
+
"git": {
|
| 42 |
+
"remote": "https://github.com/hilookas/starVLA_pickxiguapi",
|
| 43 |
+
"commit": "ab531aff5b27795879c61f67892330a616e9dbf0"
|
| 44 |
+
},
|
| 45 |
+
"email": "hilookas@gmail.com",
|
| 46 |
+
"root": "./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb",
|
| 47 |
+
"host": "g340-cd51-7700-67c8-4915-9975-7e66",
|
| 48 |
+
"executable": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3",
|
| 49 |
+
"cpu_count": 90,
|
| 50 |
+
"cpu_count_logical": 180,
|
| 51 |
+
"gpu": "NVIDIA H20",
|
| 52 |
+
"gpu_count": 8,
|
| 53 |
+
"disk": {
|
| 54 |
+
"/": {
|
| 55 |
+
"total": "3779301580800",
|
| 56 |
+
"used": "139867217920"
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"memory": {
|
| 60 |
+
"total": "2071188119552"
|
| 61 |
+
},
|
| 62 |
+
"gpu_nvidia": [
|
| 63 |
+
{
|
| 64 |
+
"name": "NVIDIA H20",
|
| 65 |
+
"memoryTotal": "102625181696",
|
| 66 |
+
"cudaCores": 9984,
|
| 67 |
+
"architecture": "Hopper",
|
| 68 |
+
"uuid": "GPU-d59be83b-3536-1644-2091-0f4464032f14"
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"name": "NVIDIA H20",
|
| 72 |
+
"memoryTotal": "102625181696",
|
| 73 |
+
"cudaCores": 9984,
|
| 74 |
+
"architecture": "Hopper",
|
| 75 |
+
"uuid": "GPU-bc06cfc2-31e9-cd6e-d8cd-635061ed592f"
|
| 76 |
+
},
|
| 77 |
+
{
|
| 78 |
+
"name": "NVIDIA H20",
|
| 79 |
+
"memoryTotal": "102625181696",
|
| 80 |
+
"cudaCores": 9984,
|
| 81 |
+
"architecture": "Hopper",
|
| 82 |
+
"uuid": "GPU-019dac1d-8bed-5b35-1123-cbd9d65ba9de"
|
| 83 |
+
},
|
| 84 |
+
{
|
| 85 |
+
"name": "NVIDIA H20",
|
| 86 |
+
"memoryTotal": "102625181696",
|
| 87 |
+
"cudaCores": 9984,
|
| 88 |
+
"architecture": "Hopper",
|
| 89 |
+
"uuid": "GPU-9ac2a386-251e-3a51-5ac7-fa4b1357bc91"
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"name": "NVIDIA H20",
|
| 93 |
+
"memoryTotal": "102625181696",
|
| 94 |
+
"cudaCores": 9984,
|
| 95 |
+
"architecture": "Hopper",
|
| 96 |
+
"uuid": "GPU-1c0156f1-dfe3-af70-9511-34e6b131ef06"
|
| 97 |
+
},
|
| 98 |
+
{
|
| 99 |
+
"name": "NVIDIA H20",
|
| 100 |
+
"memoryTotal": "102625181696",
|
| 101 |
+
"cudaCores": 9984,
|
| 102 |
+
"architecture": "Hopper",
|
| 103 |
+
"uuid": "GPU-953d951d-56e0-a563-5ca6-5acc1f8559e3"
|
| 104 |
+
},
|
| 105 |
+
{
|
| 106 |
+
"name": "NVIDIA H20",
|
| 107 |
+
"memoryTotal": "102625181696",
|
| 108 |
+
"cudaCores": 9984,
|
| 109 |
+
"architecture": "Hopper",
|
| 110 |
+
"uuid": "GPU-70a05065-a0d0-7ff4-9204-e0714e9f25c4"
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "NVIDIA H20",
|
| 114 |
+
"memoryTotal": "102625181696",
|
| 115 |
+
"cudaCores": 9984,
|
| 116 |
+
"architecture": "Hopper",
|
| 117 |
+
"uuid": "GPU-daf390d3-2cbb-d20b-9fde-c5a09c17084b"
|
| 118 |
+
}
|
| 119 |
+
],
|
| 120 |
+
"cudaVersion": "12.4",
|
| 121 |
+
"writerId": "0zkhoms4zvynscihrkuls5t7ju1xvttv"
|
| 122 |
+
}
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-12T13:32:42.27765521+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-12T13:32:45.284673898+08:00","level":"INFO","msg":"stream: created new stream","id":"xgfaxrjd"}
|
| 3 |
+
{"time":"2026-01-12T13:32:45.284920554+08:00","level":"INFO","msg":"handler: started","stream_id":"xgfaxrjd"}
|
| 4 |
+
{"time":"2026-01-12T13:32:45.310206106+08:00","level":"INFO","msg":"stream: started","id":"xgfaxrjd"}
|
| 5 |
+
{"time":"2026-01-12T13:32:45.310216651+08:00","level":"INFO","msg":"writer: started","stream_id":"xgfaxrjd"}
|
| 6 |
+
{"time":"2026-01-12T13:32:45.310224054+08:00","level":"INFO","msg":"sender: started","stream_id":"xgfaxrjd"}
|
| 7 |
+
{"time":"2026-01-12T14:18:28.350417757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 8 |
+
{"time":"2026-01-12T14:38:43.346919104+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 9 |
+
{"time":"2026-01-12T15:18:31.304717808+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded"}
|
| 10 |
+
{"time":"2026-01-12T15:52:59.271728136+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
|
| 11 |
+
{"time":"2026-01-12T18:50:56.901819762+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 12 |
+
{"time":"2026-01-12T18:51:26.812243249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 13 |
+
{"time":"2026-01-12T22:30:01.306180525+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 14 |
+
{"time":"2026-01-12T22:41:55.253842283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-13T03:06:46.307270176+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 16 |
+
{"time":"2026-01-13T03:12:11.798876383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 17 |
+
{"time":"2026-01-13T03:13:26.908899958+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
| 18 |
+
{"time":"2026-01-13T05:34:26.902207579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xgfaxrjd/file_stream\": EOF"}
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/logs/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenGR00T_0112_1323/wandb/wandb/run-20260112_133235-xgfaxrjd/run-xgfaxrjd.wandb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:045e7281399b037c32de3a2f64aefac1cc2f8d4a536831b05f86c2df5f57c487
|
| 3 |
+
size 49053696
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/config.yaml
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
datasets:
|
| 2 |
+
vla_data:
|
| 3 |
+
CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
|
| 4 |
+
Locate their bounding boxes in [x1,y1,x2,y2] format.
|
| 5 |
+
data_mix: bridge_rt_1
|
| 6 |
+
data_root_dir: ./playground/Datasets/OXE_LEROBOT
|
| 7 |
+
dataset_py: lerobot_datasets
|
| 8 |
+
image_size:
|
| 9 |
+
- 224
|
| 10 |
+
- 224
|
| 11 |
+
per_device_batch_size: 8
|
| 12 |
+
video_backend: torchvision_av
|
| 13 |
+
framework:
|
| 14 |
+
action_model:
|
| 15 |
+
action_dim: 7
|
| 16 |
+
action_horizon: 16
|
| 17 |
+
action_model_type: DiT-B
|
| 18 |
+
add_pos_embed: true
|
| 19 |
+
diffusion_model_cfg:
|
| 20 |
+
cross_attention_dim: 4096
|
| 21 |
+
dropout: 0.2
|
| 22 |
+
final_dropout: true
|
| 23 |
+
interleave_self_attention: true
|
| 24 |
+
norm_type: ada_norm
|
| 25 |
+
num_layers: 16
|
| 26 |
+
output_dim: 1024
|
| 27 |
+
positional_embeddings: null
|
| 28 |
+
future_action_window_size: 15
|
| 29 |
+
hidden_size: 1024
|
| 30 |
+
max_seq_len: 1024
|
| 31 |
+
noise_beta_alpha: 1.5
|
| 32 |
+
noise_beta_beta: 1.0
|
| 33 |
+
noise_s: 0.999
|
| 34 |
+
num_inference_timesteps: 4
|
| 35 |
+
num_target_vision_tokens: 32
|
| 36 |
+
num_timestep_buckets: 1000
|
| 37 |
+
past_action_window_size: 0
|
| 38 |
+
state_dim: 7
|
| 39 |
+
name: QwenGR00T
|
| 40 |
+
qwenvl:
|
| 41 |
+
base_vlm: /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
|
| 42 |
+
output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747
|
| 43 |
+
run_id: qwen3vl_bridge_rt1_QwenGR00T_0117_1747
|
| 44 |
+
run_root_dir: ./Checkpoints
|
| 45 |
+
seed: 42
|
| 46 |
+
trainer:
|
| 47 |
+
eval_interval: 200
|
| 48 |
+
freeze_modules: true
|
| 49 |
+
gradient_accumulation_steps: 1
|
| 50 |
+
gradient_clipping: 1.0
|
| 51 |
+
is_resume: false
|
| 52 |
+
learning_rate:
|
| 53 |
+
action_model: 0.0001
|
| 54 |
+
base: 1.0e-05
|
| 55 |
+
qwen_vl_interface: 1.0e-05
|
| 56 |
+
logging_frequency: 50
|
| 57 |
+
lr_scheduler_type: cosine_with_min_lr
|
| 58 |
+
max_train_steps: 100000
|
| 59 |
+
num_warmup_steps: 10000
|
| 60 |
+
optimizer:
|
| 61 |
+
betas:
|
| 62 |
+
- 0.9
|
| 63 |
+
- 0.95
|
| 64 |
+
eps: 1.0e-08
|
| 65 |
+
weight_decay: 1.0e-08
|
| 66 |
+
repeated_diffusion_steps: 4
|
| 67 |
+
save_interval: 10000
|
| 68 |
+
scheduler_specific_kwargs:
|
| 69 |
+
min_lr: 5.0e-07
|
| 70 |
+
wandb_entity: lookas
|
| 71 |
+
wandb_project: Qwen3VL_Bridge_RT1_GR00T
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/dataset_statistics.json
ADDED
|
@@ -0,0 +1,264 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"oxe_bridge": {
|
| 3 |
+
"action": {
|
| 4 |
+
"mean": [
|
| 5 |
+
0.00011365935642970726,
|
| 6 |
+
6.556110747624189e-05,
|
| 7 |
+
-6.320965621853247e-05,
|
| 8 |
+
-7.205353176686913e-05,
|
| 9 |
+
-0.00019515302847139537,
|
| 10 |
+
0.0001203166029881686,
|
| 11 |
+
0.28829458355903625
|
| 12 |
+
],
|
| 13 |
+
"std": [
|
| 14 |
+
0.006909770731857718,
|
| 15 |
+
0.009684093232852218,
|
| 16 |
+
0.00896290498528129,
|
| 17 |
+
0.020121052930683073,
|
| 18 |
+
0.021582655517295487,
|
| 19 |
+
0.054723342223346974,
|
| 20 |
+
0.4543627821514982
|
| 21 |
+
],
|
| 22 |
+
"max": [
|
| 23 |
+
0.41691166162490845,
|
| 24 |
+
0.25864794850349426,
|
| 25 |
+
0.21218234300613403,
|
| 26 |
+
3.122201919555664,
|
| 27 |
+
1.8618112802505493,
|
| 28 |
+
6.272472858428955,
|
| 29 |
+
1.0
|
| 30 |
+
],
|
| 31 |
+
"min": [
|
| 32 |
+
-0.4007510244846344,
|
| 33 |
+
-0.13874775171279907,
|
| 34 |
+
-0.22553899884223938,
|
| 35 |
+
-3.2010786533355713,
|
| 36 |
+
-1.8618112802505493,
|
| 37 |
+
-6.279075622558594,
|
| 38 |
+
0.0
|
| 39 |
+
],
|
| 40 |
+
"q01": [
|
| 41 |
+
-0.02875255048274994,
|
| 42 |
+
-0.04170213546603918,
|
| 43 |
+
-0.026096721179783344,
|
| 44 |
+
-0.08052874729037285,
|
| 45 |
+
-0.09249906800687313,
|
| 46 |
+
-0.20738555490970612,
|
| 47 |
+
0.0
|
| 48 |
+
],
|
| 49 |
+
"q99": [
|
| 50 |
+
0.028306663036346436,
|
| 51 |
+
0.04089853074401617,
|
| 52 |
+
0.0401805154979229,
|
| 53 |
+
0.08173403143882751,
|
| 54 |
+
0.07760760560631752,
|
| 55 |
+
0.2038465365767479,
|
| 56 |
+
1.0
|
| 57 |
+
],
|
| 58 |
+
"mask": [
|
| 59 |
+
true,
|
| 60 |
+
true,
|
| 61 |
+
true,
|
| 62 |
+
true,
|
| 63 |
+
true,
|
| 64 |
+
true,
|
| 65 |
+
false
|
| 66 |
+
]
|
| 67 |
+
},
|
| 68 |
+
"state": {
|
| 69 |
+
"mean": [
|
| 70 |
+
0.15471743047237396,
|
| 71 |
+
0.015362550504505634,
|
| 72 |
+
0.03222028166055679,
|
| 73 |
+
0.0032453201711177826,
|
| 74 |
+
-0.038600146770477295,
|
| 75 |
+
0.05382946878671646,
|
| 76 |
+
0.0,
|
| 77 |
+
0.35406652092933655
|
| 78 |
+
],
|
| 79 |
+
"std": [
|
| 80 |
+
0.1605359274864927,
|
| 81 |
+
0.06677912092232112,
|
| 82 |
+
0.048657150951527554,
|
| 83 |
+
0.09275336958940797,
|
| 84 |
+
0.12566984746914736,
|
| 85 |
+
0.41222738578801793,
|
| 86 |
+
0.0,
|
| 87 |
+
0.4330223535305803
|
| 88 |
+
],
|
| 89 |
+
"max": [
|
| 90 |
+
0.5862360596656799,
|
| 91 |
+
0.4034728705883026,
|
| 92 |
+
0.3568263053894043,
|
| 93 |
+
1.3517684936523438,
|
| 94 |
+
1.570796251296997,
|
| 95 |
+
3.141204357147217,
|
| 96 |
+
0.0,
|
| 97 |
+
1.1121242046356201
|
| 98 |
+
],
|
| 99 |
+
"min": [
|
| 100 |
+
-0.04167502000927925,
|
| 101 |
+
-0.3563207685947418,
|
| 102 |
+
-0.15537554025650024,
|
| 103 |
+
-3.141592502593994,
|
| 104 |
+
-1.4992541074752808,
|
| 105 |
+
-3.14153790473938,
|
| 106 |
+
0.0,
|
| 107 |
+
0.04637829214334488
|
| 108 |
+
],
|
| 109 |
+
"q01": [
|
| 110 |
+
0.17102622985839844,
|
| 111 |
+
-0.1698118858039379,
|
| 112 |
+
-0.055632163770496845,
|
| 113 |
+
-0.36493172496557236,
|
| 114 |
+
-0.541871190071106,
|
| 115 |
+
-1.354275494813919,
|
| 116 |
+
0.0,
|
| 117 |
+
0.052190229296684265
|
| 118 |
+
],
|
| 119 |
+
"q99": [
|
| 120 |
+
0.45322076976299286,
|
| 121 |
+
0.2354845181107521,
|
| 122 |
+
0.19489620998501778,
|
| 123 |
+
0.3780156075954437,
|
| 124 |
+
0.27568644285202026,
|
| 125 |
+
1.8500566184520721,
|
| 126 |
+
0.0,
|
| 127 |
+
1.0105689764022827
|
| 128 |
+
]
|
| 129 |
+
},
|
| 130 |
+
"num_transitions": 1305714,
|
| 131 |
+
"num_trajectories": 53192
|
| 132 |
+
},
|
| 133 |
+
"oxe_rt1": {
|
| 134 |
+
"action": {
|
| 135 |
+
"mean": [
|
| 136 |
+
0.003493750700727105,
|
| 137 |
+
0.003132961690425873,
|
| 138 |
+
-0.0063125672750175,
|
| 139 |
+
0.02166595682501793,
|
| 140 |
+
-0.0028780836146324873,
|
| 141 |
+
0.0004565489653032273,
|
| 142 |
+
0.26771023869514465
|
| 143 |
+
],
|
| 144 |
+
"std": [
|
| 145 |
+
0.049065014465362655,
|
| 146 |
+
0.04229853739828572,
|
| 147 |
+
0.05237628880142378,
|
| 148 |
+
0.1124860236500875,
|
| 149 |
+
0.09312952783816872,
|
| 150 |
+
0.10319098309601091,
|
| 151 |
+
0.4418448662622395
|
| 152 |
+
],
|
| 153 |
+
"max": [
|
| 154 |
+
2.9984593391418457,
|
| 155 |
+
22.09052848815918,
|
| 156 |
+
2.7507524490356445,
|
| 157 |
+
1.570636510848999,
|
| 158 |
+
1.5321086645126343,
|
| 159 |
+
1.5691522359848022,
|
| 160 |
+
1.0
|
| 161 |
+
],
|
| 162 |
+
"min": [
|
| 163 |
+
-2.0204520225524902,
|
| 164 |
+
-5.497899532318115,
|
| 165 |
+
-2.031663417816162,
|
| 166 |
+
-1.569917917251587,
|
| 167 |
+
-1.569892168045044,
|
| 168 |
+
-1.570419430732727,
|
| 169 |
+
0.0
|
| 170 |
+
],
|
| 171 |
+
"q01": [
|
| 172 |
+
-0.22453527510166169,
|
| 173 |
+
-0.14820013284683228,
|
| 174 |
+
-0.231589707583189,
|
| 175 |
+
-0.3517994859814644,
|
| 176 |
+
-0.4193011274933815,
|
| 177 |
+
-0.43643461108207704,
|
| 178 |
+
0.0
|
| 179 |
+
],
|
| 180 |
+
"q99": [
|
| 181 |
+
0.17824687153100965,
|
| 182 |
+
0.14938379630446405,
|
| 183 |
+
0.21842354819178575,
|
| 184 |
+
0.5892666035890578,
|
| 185 |
+
0.35272657424211445,
|
| 186 |
+
0.44796681255102094,
|
| 187 |
+
1.0
|
| 188 |
+
],
|
| 189 |
+
"mask": [
|
| 190 |
+
true,
|
| 191 |
+
true,
|
| 192 |
+
true,
|
| 193 |
+
true,
|
| 194 |
+
true,
|
| 195 |
+
true,
|
| 196 |
+
false
|
| 197 |
+
]
|
| 198 |
+
},
|
| 199 |
+
"state": {
|
| 200 |
+
"mean": [
|
| 201 |
+
0.2799473702907562,
|
| 202 |
+
-0.04167069122195244,
|
| 203 |
+
0.38854750990867615,
|
| 204 |
+
0.21306729316711426,
|
| 205 |
+
-0.12402277439832687,
|
| 206 |
+
0.24756911396980286,
|
| 207 |
+
0.046330634504556656,
|
| 208 |
+
0.10487449914216995
|
| 209 |
+
],
|
| 210 |
+
"std": [
|
| 211 |
+
0.29342642876909925,
|
| 212 |
+
0.09174024655686211,
|
| 213 |
+
0.42569508885539115,
|
| 214 |
+
0.38616252611341306,
|
| 215 |
+
0.38314586427420927,
|
| 216 |
+
0.44433568806919804,
|
| 217 |
+
0.1263927443679382,
|
| 218 |
+
0.22122596673781084
|
| 219 |
+
],
|
| 220 |
+
"max": [
|
| 221 |
+
1.0534898042678833,
|
| 222 |
+
0.48018959164619446,
|
| 223 |
+
1.6896663904190063,
|
| 224 |
+
1.0,
|
| 225 |
+
0.9999993443489075,
|
| 226 |
+
0.9999874830245972,
|
| 227 |
+
0.9554369449615479,
|
| 228 |
+
0.9914546012878418
|
| 229 |
+
],
|
| 230 |
+
"min": [
|
| 231 |
+
-0.4436439275741577,
|
| 232 |
+
-0.9970501065254211,
|
| 233 |
+
-0.006579156965017319,
|
| 234 |
+
0.0,
|
| 235 |
+
-0.8643477559089661,
|
| 236 |
+
-0.7079970240592957,
|
| 237 |
+
-0.7688722014427185,
|
| 238 |
+
-0.4999994933605194
|
| 239 |
+
],
|
| 240 |
+
"q01": [
|
| 241 |
+
0.32481380939483645,
|
| 242 |
+
-0.28334290891885755,
|
| 243 |
+
0.14107070609927178,
|
| 244 |
+
0.0,
|
| 245 |
+
-0.686474204659462,
|
| 246 |
+
-0.6808923494815826,
|
| 247 |
+
-0.36045596331357954,
|
| 248 |
+
-0.454380963742733
|
| 249 |
+
],
|
| 250 |
+
"q99": [
|
| 251 |
+
0.8750156319141384,
|
| 252 |
+
0.21247054174542404,
|
| 253 |
+
1.0727112340927123,
|
| 254 |
+
1.0,
|
| 255 |
+
0.9377871316671368,
|
| 256 |
+
0.9563051050901409,
|
| 257 |
+
0.45990042358636823,
|
| 258 |
+
0.7216041100025177
|
| 259 |
+
]
|
| 260 |
+
},
|
| 261 |
+
"num_transitions": 3786152,
|
| 262 |
+
"num_trajectories": 87212
|
| 263 |
+
}
|
| 264 |
+
}
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/run_qwen3vl_bridge_rt1_qwen_gr00t.sh
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Framework_name=QwenGR00T
|
| 2 |
+
dit_type="DiT-B"
|
| 3 |
+
freeze_module_list='' # empty = full fine-tuning (nothing frozen). NOTE: expand this in double quotes; unquoted, an empty value vanishes from the command line
|
| 4 |
+
data_mix=bridge_rt_1
|
| 5 |
+
|
| 6 |
+
## Modify below paths before running ##
|
| 7 |
+
date_time=$(date +%m%d_%H%M)
|
| 8 |
+
config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml
|
| 9 |
+
base_vlm=/home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
|
| 10 |
+
data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
|
| 11 |
+
run_root_dir=./Checkpoints
|
| 12 |
+
run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
|
| 13 |
+
batch_size=8
|
| 14 |
+
wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
|
| 15 |
+
wandb_entity=lookas
|
| 16 |
+
|
| 17 |
+
# export WANDB_MODE=disabled
|
| 18 |
+
|
| 19 |
+
output_dir=${run_root_dir}/${run_id}
|
| 20 |
+
mkdir -p "${output_dir}"
|
| 21 |
+
cp "$0" "${output_dir}/"
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
accelerate launch --main_process_port 12773 \
|
| 25 |
+
--config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 26 |
+
--num_processes 8 \
|
| 27 |
+
starVLA/training/train_starvla.py \
|
| 28 |
+
--config_yaml ${config_yaml} \
|
| 29 |
+
--framework.name ${Framework_name} \
|
| 30 |
+
--framework.qwenvl.base_vlm ${base_vlm} \
|
| 31 |
+
--datasets.vla_data.data_root_dir "${data_root_dir}" \
|
| 32 |
+
--datasets.vla_data.data_mix ${data_mix} \
|
| 33 |
+
--datasets.vla_data.per_device_batch_size ${batch_size} \
|
| 34 |
+
--trainer.freeze_modules "${freeze_module_list}" \
|
| 35 |
+
--trainer.max_train_steps 100000 \
|
| 36 |
+
--trainer.save_interval 10000 \
|
| 37 |
+
--trainer.logging_frequency 50 \
|
| 38 |
+
--trainer.eval_interval 200 \
|
| 39 |
+
--run_root_dir ${run_root_dir} \
|
| 40 |
+
--run_id ${run_id} \
|
| 41 |
+
--output_dir ${output_dir} \
|
| 42 |
+
--wandb_project "${wandb_project}" \
|
| 43 |
+
--wandb_entity "${wandb_entity}"
|
| 44 |
+
|
| 45 |
+
|
| 46 |
+
# multi-node launch example
|
| 47 |
+
|
| 48 |
+
# accelerate launch \
|
| 49 |
+
# --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 50 |
+
# --main_process_ip $MASTER_ADDR \
|
| 51 |
+
# --main_process_port $MASTER_PORT \
|
| 52 |
+
# --machine_rank $SLURM_PROCID \
|
| 53 |
+
# --num_machines $SLURM_NNODES \
|
| 54 |
+
# --num_processes=${TOTAL_GPUS} \
|
| 55 |
+
# starVLA/training/train_starvla.py \
|
| 56 |
+
# --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
|
| 57 |
+
# --framework.framework_py QwenGR00T \
|
| 58 |
+
# --framework.qwenvl.base_vlm microsoft/Florence-2-large \
|
| 59 |
+
# --run_root_dir ${run_root_dir} \
|
| 60 |
+
# --run_id ${run_id} \
|
| 61 |
+
# --wandb_project your_project \
|
| 62 |
+
# --wandb_entity your_name
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/summary.jsonl
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"steps": 10000}
|
| 2 |
+
{"steps": 20000}
|
| 3 |
+
{"steps": 30000}
|
| 4 |
+
{"steps": 40000}
|
| 5 |
+
{"steps": 50000}
|
| 6 |
+
{"steps": 60000}
|
| 7 |
+
{"steps": 70000}
|
| 8 |
+
{"steps": 80000}
|
| 9 |
+
{"steps": 90000}
|
| 10 |
+
{"steps": 100000}
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug-internal.log
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-17T18:03:45.356692165+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-17T18:03:48.552330417+08:00","level":"INFO","msg":"stream: created new stream","id":"xbap43rk"}
|
| 3 |
+
{"time":"2026-01-17T18:03:48.552524112+08:00","level":"INFO","msg":"handler: started","stream_id":"xbap43rk"}
|
| 4 |
+
{"time":"2026-01-17T18:03:48.577796615+08:00","level":"INFO","msg":"stream: started","id":"xbap43rk"}
|
| 5 |
+
{"time":"2026-01-17T18:03:48.577817586+08:00","level":"INFO","msg":"writer: started","stream_id":"xbap43rk"}
|
| 6 |
+
{"time":"2026-01-17T18:03:48.577832655+08:00","level":"INFO","msg":"sender: started","stream_id":"xbap43rk"}
|
| 7 |
+
{"time":"2026-01-17T20:02:17.852359064+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 8 |
+
{"time":"2026-01-17T20:04:33.007831623+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 9 |
+
{"time":"2026-01-17T20:35:32.863685268+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 10 |
+
{"time":"2026-01-17T22:03:46.318542143+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 11 |
+
{"time":"2026-01-17T22:48:34.635180932+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 12 |
+
{"time":"2026-01-17T22:55:57.518503703+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 13 |
+
{"time":"2026-01-17T23:07:48.293218261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 14 |
+
{"time":"2026-01-17T23:08:32.231325893+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-17T23:12:50.87203047+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 16 |
+
{"time":"2026-01-17T23:13:18.698788758+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": http2: client conn is closed"}
|
| 17 |
+
{"time":"2026-01-17T23:16:49.881636821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-01-17T23:25:00.472362504+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-01-18T00:16:02.236615436+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-01-18T00:33:00.268425846+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 21 |
+
{"time":"2026-01-18T00:33:13.186386827+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 22 |
+
{"time":"2026-01-18T02:52:45.26127457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 23 |
+
{"time":"2026-01-18T02:53:30.366178096+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 24 |
+
{"time":"2026-01-18T04:54:45.36780745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 25 |
+
{"time":"2026-01-18T04:55:30.238642915+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 26 |
+
{"time":"2026-01-18T04:55:42.722661208+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 27 |
+
{"time":"2026-01-18T04:56:15.382797183+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 28 |
+
{"time":"2026-01-18T08:43:45.342343851+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 29 |
+
{"time":"2026-01-18T08:44:00.358330288+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 30 |
+
{"time":"2026-01-18T08:44:30.251461638+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 31 |
+
{"time":"2026-01-18T10:47:45.345590419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 32 |
+
{"time":"2026-01-18T12:47:15.286316861+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 33 |
+
{"time":"2026-01-18T13:40:46.383240786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 34 |
+
{"time":"2026-01-18T16:22:00.269227917+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 35 |
+
{"time":"2026-01-18T16:23:00.259212087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 36 |
+
{"time":"2026-01-18T16:26:15.279544821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 37 |
+
{"time":"2026-01-18T16:28:15.394951264+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 38 |
+
{"time":"2026-01-18T16:28:28.376139107+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 39 |
+
{"time":"2026-01-18T16:32:34.771745298+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 40 |
+
{"time":"2026-01-18T16:32:50.854108579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 41 |
+
{"time":"2026-01-18T16:33:15.253909146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 42 |
+
{"time":"2026-01-18T16:33:30.268871735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 43 |
+
{"time":"2026-01-18T16:33:45.254149217+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 44 |
+
{"time":"2026-01-18T16:33:57.84608755+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 45 |
+
{"time":"2026-01-18T16:34:14.118425621+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 46 |
+
{"time":"2026-01-18T16:34:26.791643445+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 47 |
+
{"time":"2026-01-18T16:35:30.392649391+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 48 |
+
{"time":"2026-01-18T16:35:45.390391138+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 49 |
+
{"time":"2026-01-18T16:37:00.231753869+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 50 |
+
{"time":"2026-01-18T16:39:00.308923433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 51 |
+
{"time":"2026-01-18T16:50:44.109993399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 52 |
+
{"time":"2026-01-18T16:56:44.222721195+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 53 |
+
{"time":"2026-01-18T16:56:59.182350472+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 54 |
+
{"time":"2026-01-18T16:57:12.200012616+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 55 |
+
{"time":"2026-01-18T16:57:30.278294605+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 56 |
+
{"time":"2026-01-18T16:57:45.272613563+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 57 |
+
{"time":"2026-01-18T16:57:58.361466419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 58 |
+
{"time":"2026-01-18T16:58:16.374502713+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 59 |
+
{"time":"2026-01-18T17:01:49.770643385+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 60 |
+
{"time":"2026-01-18T17:03:00.288457229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 61 |
+
{"time":"2026-01-18T17:03:45.353334974+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 62 |
+
{"time":"2026-01-18T18:17:45.365055726+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 63 |
+
{"time":"2026-01-18T18:24:00.357867283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 64 |
+
{"time":"2026-01-18T19:06:15.375047877+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 65 |
+
{"time":"2026-01-18T19:06:28.413756607+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 66 |
+
{"time":"2026-01-18T19:15:30.232002999+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 67 |
+
{"time":"2026-01-18T19:39:30.251864251+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 68 |
+
{"time":"2026-01-18T19:40:00.288831216+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 69 |
+
{"time":"2026-01-18T19:52:30.252619907+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 70 |
+
{"time":"2026-01-18T20:51:49.773485296+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 71 |
+
{"time":"2026-01-18T21:32:54.188737252+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 72 |
+
{"time":"2026-01-18T22:14:31.789385651+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 73 |
+
{"time":"2026-01-19T00:11:15.393839366+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 74 |
+
{"time":"2026-01-19T00:50:30.380524837+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 75 |
+
{"time":"2026-01-19T00:51:00.395000654+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 76 |
+
{"time":"2026-01-19T00:51:13.162530742+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 77 |
+
{"time":"2026-01-19T00:54:30.249839041+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 78 |
+
{"time":"2026-01-19T00:55:30.349433303+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 79 |
+
{"time":"2026-01-19T01:00:31.333972122+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 80 |
+
{"time":"2026-01-19T01:19:30.367251508+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 81 |
+
{"time":"2026-01-19T01:20:30.296201955+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 82 |
+
{"time":"2026-01-19T01:51:00.221611746+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 83 |
+
{"time":"2026-01-19T01:52:30.445846213+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 84 |
+
{"time":"2026-01-19T02:02:15.651403576+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 85 |
+
{"time":"2026-01-19T02:02:17.343084437+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
|
| 86 |
+
{"time":"2026-01-19T02:02:17.352284781+08:00","level":"INFO","msg":"stream: closing","id":"xbap43rk"}
|
| 87 |
+
{"time":"2026-01-19T02:02:17.35229661+08:00","level":"INFO","msg":"handler: closed","stream_id":"xbap43rk"}
|
| 88 |
+
{"time":"2026-01-19T02:02:17.384196864+08:00","level":"INFO","msg":"sender: closed","stream_id":"xbap43rk"}
|
| 89 |
+
{"time":"2026-01-19T02:02:17.384209276+08:00","level":"INFO","msg":"stream: closed","id":"xbap43rk"}
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/config.yaml
ADDED
|
@@ -0,0 +1,133 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_wandb:
|
| 2 |
+
value:
|
| 3 |
+
cli_version: 0.23.1
|
| 4 |
+
e:
|
| 5 |
+
qsdugxujhb6s3j19wae2dfqwajsgmsw2:
|
| 6 |
+
args:
|
| 7 |
+
- --config_yaml
|
| 8 |
+
- scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml
|
| 9 |
+
- --framework.name
|
| 10 |
+
- QwenGR00T
|
| 11 |
+
- --framework.qwenvl.base_vlm
|
| 12 |
+
- /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
|
| 13 |
+
- --datasets.vla_data.data_root_dir
|
| 14 |
+
- ./playground/Datasets/OXE_LEROBOT
|
| 15 |
+
- --datasets.vla_data.data_mix
|
| 16 |
+
- bridge_rt_1
|
| 17 |
+
- --datasets.vla_data.per_device_batch_size
|
| 18 |
+
- "8"
|
| 19 |
+
- --trainer.freeze_modules
|
| 20 |
+
- --trainer.max_train_steps
|
| 21 |
+
- "100000"
|
| 22 |
+
- --trainer.save_interval
|
| 23 |
+
- "10000"
|
| 24 |
+
- --trainer.logging_frequency
|
| 25 |
+
- "50"
|
| 26 |
+
- --trainer.eval_interval
|
| 27 |
+
- "200"
|
| 28 |
+
- --run_root_dir
|
| 29 |
+
- ./Checkpoints
|
| 30 |
+
- --run_id
|
| 31 |
+
- qwen3vl_bridge_rt1_QwenGR00T_0117_1747
|
| 32 |
+
- --output_dir
|
| 33 |
+
- ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747
|
| 34 |
+
- --wandb.project
|
| 35 |
+
- Qwen3VL_Bridge_RT1_QwenGR00T
|
| 36 |
+
- --wandb.entity
|
| 37 |
+
- lookas
|
| 38 |
+
codePath: starVLA/training/train_starvla.py
|
| 39 |
+
codePathLocal: starVLA/training/train_starvla.py
|
| 40 |
+
cpu_count: 90
|
| 41 |
+
cpu_count_logical: 180
|
| 42 |
+
cudaVersion: "12.4"
|
| 43 |
+
disk:
|
| 44 |
+
/:
|
| 45 |
+
total: "3779301580800"
|
| 46 |
+
used: "151673700352"
|
| 47 |
+
email: hilookas@gmail.com
|
| 48 |
+
executable: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3
|
| 49 |
+
git:
|
| 50 |
+
commit: ab531aff5b27795879c61f67892330a616e9dbf0
|
| 51 |
+
remote: https://github.com/hilookas/starVLA_pickxiguapi
|
| 52 |
+
gpu: NVIDIA H20
|
| 53 |
+
gpu_count: 8
|
| 54 |
+
gpu_nvidia:
|
| 55 |
+
- architecture: Hopper
|
| 56 |
+
cudaCores: 9984
|
| 57 |
+
memoryTotal: "102625181696"
|
| 58 |
+
name: NVIDIA H20
|
| 59 |
+
uuid: GPU-f99bae5f-ffca-4972-6420-64c42ba64f22
|
| 60 |
+
- architecture: Hopper
|
| 61 |
+
cudaCores: 9984
|
| 62 |
+
memoryTotal: "102625181696"
|
| 63 |
+
name: NVIDIA H20
|
| 64 |
+
uuid: GPU-a00709c9-6bdf-4011-64dc-95421da94ba4
|
| 65 |
+
- architecture: Hopper
|
| 66 |
+
cudaCores: 9984
|
| 67 |
+
memoryTotal: "102625181696"
|
| 68 |
+
name: NVIDIA H20
|
| 69 |
+
uuid: GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5
|
| 70 |
+
- architecture: Hopper
|
| 71 |
+
cudaCores: 9984
|
| 72 |
+
memoryTotal: "102625181696"
|
| 73 |
+
name: NVIDIA H20
|
| 74 |
+
uuid: GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9
|
| 75 |
+
- architecture: Hopper
|
| 76 |
+
cudaCores: 9984
|
| 77 |
+
memoryTotal: "102625181696"
|
| 78 |
+
name: NVIDIA H20
|
| 79 |
+
uuid: GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218
|
| 80 |
+
- architecture: Hopper
|
| 81 |
+
cudaCores: 9984
|
| 82 |
+
memoryTotal: "102625181696"
|
| 83 |
+
name: NVIDIA H20
|
| 84 |
+
uuid: GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde
|
| 85 |
+
- architecture: Hopper
|
| 86 |
+
cudaCores: 9984
|
| 87 |
+
memoryTotal: "102625181696"
|
| 88 |
+
name: NVIDIA H20
|
| 89 |
+
uuid: GPU-4fa493fc-c408-182f-138e-bcc15c7f9138
|
| 90 |
+
- architecture: Hopper
|
| 91 |
+
cudaCores: 9984
|
| 92 |
+
memoryTotal: "102625181696"
|
| 93 |
+
name: NVIDIA H20
|
| 94 |
+
uuid: GPU-16ef9185-6132-8620-ad2e-1f8920ded508
|
| 95 |
+
host: g340-cd51-7700-770-343f-3fec-69bb
|
| 96 |
+
memory:
|
| 97 |
+
total: "2071188119552"
|
| 98 |
+
os: Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36
|
| 99 |
+
program: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py
|
| 100 |
+
python: CPython 3.10.19
|
| 101 |
+
root: ./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb
|
| 102 |
+
startedAt: "2026-01-17T10:03:39.069637Z"
|
| 103 |
+
writerId: qsdugxujhb6s3j19wae2dfqwajsgmsw2
|
| 104 |
+
m: []
|
| 105 |
+
python_version: 3.10.19
|
| 106 |
+
t:
|
| 107 |
+
"1":
|
| 108 |
+
- 1
|
| 109 |
+
- 11
|
| 110 |
+
- 41
|
| 111 |
+
- 49
|
| 112 |
+
- 63
|
| 113 |
+
- 71
|
| 114 |
+
- 80
|
| 115 |
+
- 83
|
| 116 |
+
"2":
|
| 117 |
+
- 1
|
| 118 |
+
- 11
|
| 119 |
+
- 41
|
| 120 |
+
- 49
|
| 121 |
+
- 63
|
| 122 |
+
- 71
|
| 123 |
+
- 80
|
| 124 |
+
- 83
|
| 125 |
+
"3":
|
| 126 |
+
- 2
|
| 127 |
+
- 13
|
| 128 |
+
- 61
|
| 129 |
+
"4": 3.10.19
|
| 130 |
+
"5": 0.23.1
|
| 131 |
+
"6": 4.57.3
|
| 132 |
+
"12": 0.23.1
|
| 133 |
+
"13": linux-x86_64
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/output.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/requirements.txt
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
starVLA==1.0.1
|
| 2 |
+
absl-py==2.3.1
|
| 3 |
+
accelerate==1.5.2
|
| 4 |
+
albucore==0.0.17
|
| 5 |
+
albumentations==1.4.18
|
| 6 |
+
annotated-types==0.7.0
|
| 7 |
+
antlr4-python3-runtime==4.9.3
|
| 8 |
+
anyio==4.12.0
|
| 9 |
+
asttokens==3.0.1
|
| 10 |
+
attrs==20.3.0
|
| 11 |
+
av==12.3.0
|
| 12 |
+
bddl==1.0.1
|
| 13 |
+
certifi==2025.11.12
|
| 14 |
+
charset-normalizer==3.4.4
|
| 15 |
+
click==8.3.1
|
| 16 |
+
cloudpickle==3.1.2
|
| 17 |
+
contourpy==1.3.2
|
| 18 |
+
cramjam==2.11.0
|
| 19 |
+
cycler==0.12.1
|
| 20 |
+
debugpy==1.8.19
|
| 21 |
+
decorator==5.2.1
|
| 22 |
+
decord==0.6.0
|
| 23 |
+
deepspeed==0.16.9
|
| 24 |
+
diffusers==0.36.0
|
| 25 |
+
docstring_parser==0.17.0
|
| 26 |
+
easydict==1.9
|
| 27 |
+
einops==0.8.1
|
| 28 |
+
etils==1.13.0
|
| 29 |
+
eva-decord==0.6.1
|
| 30 |
+
eval_type_backport==0.3.1
|
| 31 |
+
exceptiongroup==1.3.1
|
| 32 |
+
executing==2.2.1
|
| 33 |
+
fastjsonschema==2.21.2
|
| 34 |
+
fastparquet==2024.11.0
|
| 35 |
+
filelock==3.20.2
|
| 36 |
+
flash_attn==2.8.3
|
| 37 |
+
fonttools==4.61.1
|
| 38 |
+
fsspec==2025.12.0
|
| 39 |
+
future==0.18.2
|
| 40 |
+
fvcore==0.1.5.post20221221
|
| 41 |
+
gevent==25.9.1
|
| 42 |
+
gitdb==4.0.12
|
| 43 |
+
GitPython==3.1.46
|
| 44 |
+
glfw==2.10.0
|
| 45 |
+
greenlet==3.3.0
|
| 46 |
+
grpcio==1.76.0
|
| 47 |
+
gym==0.26.2
|
| 48 |
+
gym-notices==0.1.0
|
| 49 |
+
h11==0.16.0
|
| 50 |
+
hf-xet==1.2.0
|
| 51 |
+
hjson==3.1.0
|
| 52 |
+
httpcore==1.0.9
|
| 53 |
+
httpx==0.28.1
|
| 54 |
+
huggingface-hub==0.36.0
|
| 55 |
+
idna==3.11
|
| 56 |
+
ImageIO==2.37.2
|
| 57 |
+
importlib_metadata==8.7.1
|
| 58 |
+
importlib_resources==6.5.2
|
| 59 |
+
iniconfig==2.3.0
|
| 60 |
+
iopath==0.1.10
|
| 61 |
+
ipdb==0.13.13
|
| 62 |
+
ipython==8.37.0
|
| 63 |
+
jedi==0.19.2
|
| 64 |
+
Jinja2==3.1.6
|
| 65 |
+
jsonschema==4.17.3
|
| 66 |
+
jupyter_core==5.9.1
|
| 67 |
+
jupytext==1.18.1
|
| 68 |
+
kiwisolver==1.4.9
|
| 69 |
+
lazy_loader==0.4
|
| 70 |
+
libero==0.1.0
|
| 71 |
+
llvmlite==0.46.0
|
| 72 |
+
Markdown==3.10
|
| 73 |
+
markdown-it-py==4.0.0
|
| 74 |
+
MarkupSafe==3.0.3
|
| 75 |
+
matplotlib==3.10.8
|
| 76 |
+
matplotlib-inline==0.2.1
|
| 77 |
+
mdit-py-plugins==0.5.0
|
| 78 |
+
mdurl==0.1.2
|
| 79 |
+
mpmath==1.3.0
|
| 80 |
+
msgpack==1.1.2
|
| 81 |
+
mujoco==3.4.0
|
| 82 |
+
nbformat==5.10.4
|
| 83 |
+
networkx==3.4.2
|
| 84 |
+
ninja==1.13.0
|
| 85 |
+
numba==0.63.1
|
| 86 |
+
numpy==1.26.4
|
| 87 |
+
numpydantic==1.6.9
|
| 88 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 89 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 90 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 91 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 92 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 93 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 94 |
+
nvidia-curand-cu12==10.3.5.147
|
| 95 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 96 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 97 |
+
nvidia-nccl-cu12==2.21.5
|
| 98 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 99 |
+
nvidia-nvtx-cu12==12.4.127
|
| 100 |
+
omegaconf==2.3.0
|
| 101 |
+
opencv-python==4.11.0.86
|
| 102 |
+
opencv-python-headless==4.11.0.86
|
| 103 |
+
packaging==25.0
|
| 104 |
+
pandas==2.3.3
|
| 105 |
+
parso==0.8.5
|
| 106 |
+
pexpect==4.9.0
|
| 107 |
+
pillow==12.1.0
|
| 108 |
+
pipablepytorch3d==0.7.6
|
| 109 |
+
platformdirs==4.5.1
|
| 110 |
+
pluggy==1.6.0
|
| 111 |
+
portalocker==3.2.0
|
| 112 |
+
prompt_toolkit==3.0.52
|
| 113 |
+
protobuf==6.33.2
|
| 114 |
+
psutil==7.2.1
|
| 115 |
+
ptyprocess==0.7.0
|
| 116 |
+
pure_eval==0.2.3
|
| 117 |
+
py-cpuinfo==9.0.0
|
| 118 |
+
pyarrow==14.0.1
|
| 119 |
+
pydantic==2.10.6
|
| 120 |
+
pydantic_core==2.27.2
|
| 121 |
+
Pygments==2.19.2
|
| 122 |
+
PyOpenGL==3.1.10
|
| 123 |
+
pyparsing==3.3.1
|
| 124 |
+
pyrsistent==0.20.0
|
| 125 |
+
pytest==9.0.2
|
| 126 |
+
python-dateutil==2.9.0.post0
|
| 127 |
+
pytz==2025.2
|
| 128 |
+
PyYAML==6.0.3
|
| 129 |
+
qwen-vl-utils==0.0.14
|
| 130 |
+
regex==2025.11.3
|
| 131 |
+
requests==2.32.5
|
| 132 |
+
rich==14.2.0
|
| 133 |
+
robosuite==1.4.0
|
| 134 |
+
safetensors==0.7.0
|
| 135 |
+
scikit-image==0.25.2
|
| 136 |
+
scipy==1.15.3
|
| 137 |
+
sentry-sdk==2.48.0
|
| 138 |
+
setuptools==80.9.0
|
| 139 |
+
six==1.17.0
|
| 140 |
+
smmap==5.0.2
|
| 141 |
+
stack-data==0.6.3
|
| 142 |
+
starVLA==1.0.1
|
| 143 |
+
sympy==1.13.1
|
| 144 |
+
tabulate==0.9.0
|
| 145 |
+
tensorboard==2.20.0
|
| 146 |
+
tensorboard-data-server==0.7.2
|
| 147 |
+
termcolor==3.3.0
|
| 148 |
+
tifffile==2025.5.10
|
| 149 |
+
tiktoken==0.12.0
|
| 150 |
+
timm==1.0.22
|
| 151 |
+
tokenizers==0.22.1
|
| 152 |
+
tomli==2.3.0
|
| 153 |
+
torch==2.5.1
|
| 154 |
+
torchvision==0.20.1
|
| 155 |
+
tqdm==4.67.1
|
| 156 |
+
traitlets==5.14.3
|
| 157 |
+
transformers==4.57.3
|
| 158 |
+
transformers-stream-generator==0.0.4
|
| 159 |
+
triton==3.1.0
|
| 160 |
+
typeguard==4.4.4
|
| 161 |
+
typing_extensions==4.15.0
|
| 162 |
+
tyro==1.0.3
|
| 163 |
+
tzdata==2025.3
|
| 164 |
+
urllib3==2.6.2
|
| 165 |
+
wandb==0.23.1
|
| 166 |
+
wcwidth==0.2.14
|
| 167 |
+
websocket==0.2.1
|
| 168 |
+
websocket-client==1.8.0
|
| 169 |
+
websockets==15.0.1
|
| 170 |
+
Werkzeug==3.1.4
|
| 171 |
+
yacs==0.1.8
|
| 172 |
+
zipp==3.23.0
|
| 173 |
+
zope.event==6.1
|
| 174 |
+
zope.interface==8.1.1
|
| 175 |
+
autocommand==2.2.2
|
| 176 |
+
backports.tarfile==1.2.0
|
| 177 |
+
importlib_metadata==8.0.0
|
| 178 |
+
inflect==7.3.1
|
| 179 |
+
jaraco.collections==5.1.0
|
| 180 |
+
jaraco.context==5.3.0
|
| 181 |
+
jaraco.functools==4.0.1
|
| 182 |
+
jaraco.text==3.12.1
|
| 183 |
+
more-itertools==10.3.0
|
| 184 |
+
packaging==24.2
|
| 185 |
+
platformdirs==4.2.2
|
| 186 |
+
tomli==2.0.1
|
| 187 |
+
typeguard==4.3.0
|
| 188 |
+
typing_extensions==4.12.2
|
| 189 |
+
wheel==0.45.1
|
| 190 |
+
zipp==3.19.2
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,122 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36",
|
| 3 |
+
"python": "CPython 3.10.19",
|
| 4 |
+
"startedAt": "2026-01-17T10:03:39.069637Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--config_yaml",
|
| 7 |
+
"scripts/ER1_5/qwen3vl_bridge_rt1_gr00t.yaml",
|
| 8 |
+
"--framework.name",
|
| 9 |
+
"QwenGR00T",
|
| 10 |
+
"--framework.qwenvl.base_vlm",
|
| 11 |
+
"/home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9",
|
| 12 |
+
"--datasets.vla_data.data_root_dir",
|
| 13 |
+
"./playground/Datasets/OXE_LEROBOT",
|
| 14 |
+
"--datasets.vla_data.data_mix",
|
| 15 |
+
"bridge_rt_1",
|
| 16 |
+
"--datasets.vla_data.per_device_batch_size",
|
| 17 |
+
"8",
|
| 18 |
+
"--trainer.freeze_modules",
|
| 19 |
+
"--trainer.max_train_steps",
|
| 20 |
+
"100000",
|
| 21 |
+
"--trainer.save_interval",
|
| 22 |
+
"10000",
|
| 23 |
+
"--trainer.logging_frequency",
|
| 24 |
+
"50",
|
| 25 |
+
"--trainer.eval_interval",
|
| 26 |
+
"200",
|
| 27 |
+
"--run_root_dir",
|
| 28 |
+
"./Checkpoints",
|
| 29 |
+
"--run_id",
|
| 30 |
+
"qwen3vl_bridge_rt1_QwenGR00T_0117_1747",
|
| 31 |
+
"--output_dir",
|
| 32 |
+
"./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747",
|
| 33 |
+
"--wandb.project",
|
| 34 |
+
"Qwen3VL_Bridge_RT1_QwenGR00T",
|
| 35 |
+
"--wandb.entity",
|
| 36 |
+
"lookas"
|
| 37 |
+
],
|
| 38 |
+
"program": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py",
|
| 39 |
+
"codePath": "starVLA/training/train_starvla.py",
|
| 40 |
+
"codePathLocal": "starVLA/training/train_starvla.py",
|
| 41 |
+
"git": {
|
| 42 |
+
"remote": "https://github.com/hilookas/starVLA_pickxiguapi",
|
| 43 |
+
"commit": "ab531aff5b27795879c61f67892330a616e9dbf0"
|
| 44 |
+
},
|
| 45 |
+
"email": "hilookas@gmail.com",
|
| 46 |
+
"root": "./Checkpoints/qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb",
|
| 47 |
+
"host": "g340-cd51-7700-770-343f-3fec-69bb",
|
| 48 |
+
"executable": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3",
|
| 49 |
+
"cpu_count": 90,
|
| 50 |
+
"cpu_count_logical": 180,
|
| 51 |
+
"gpu": "NVIDIA H20",
|
| 52 |
+
"gpu_count": 8,
|
| 53 |
+
"disk": {
|
| 54 |
+
"/": {
|
| 55 |
+
"total": "3779301580800",
|
| 56 |
+
"used": "151673700352"
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"memory": {
|
| 60 |
+
"total": "2071188119552"
|
| 61 |
+
},
|
| 62 |
+
"gpu_nvidia": [
|
| 63 |
+
{
|
| 64 |
+
"name": "NVIDIA H20",
|
| 65 |
+
"memoryTotal": "102625181696",
|
| 66 |
+
"cudaCores": 9984,
|
| 67 |
+
"architecture": "Hopper",
|
| 68 |
+
"uuid": "GPU-f99bae5f-ffca-4972-6420-64c42ba64f22"
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"name": "NVIDIA H20",
|
| 72 |
+
"memoryTotal": "102625181696",
|
| 73 |
+
"cudaCores": 9984,
|
| 74 |
+
"architecture": "Hopper",
|
| 75 |
+
"uuid": "GPU-a00709c9-6bdf-4011-64dc-95421da94ba4"
|
| 76 |
+
},
|
| 77 |
+
{
|
| 78 |
+
"name": "NVIDIA H20",
|
| 79 |
+
"memoryTotal": "102625181696",
|
| 80 |
+
"cudaCores": 9984,
|
| 81 |
+
"architecture": "Hopper",
|
| 82 |
+
"uuid": "GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5"
|
| 83 |
+
},
|
| 84 |
+
{
|
| 85 |
+
"name": "NVIDIA H20",
|
| 86 |
+
"memoryTotal": "102625181696",
|
| 87 |
+
"cudaCores": 9984,
|
| 88 |
+
"architecture": "Hopper",
|
| 89 |
+
"uuid": "GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9"
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"name": "NVIDIA H20",
|
| 93 |
+
"memoryTotal": "102625181696",
|
| 94 |
+
"cudaCores": 9984,
|
| 95 |
+
"architecture": "Hopper",
|
| 96 |
+
"uuid": "GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218"
|
| 97 |
+
},
|
| 98 |
+
{
|
| 99 |
+
"name": "NVIDIA H20",
|
| 100 |
+
"memoryTotal": "102625181696",
|
| 101 |
+
"cudaCores": 9984,
|
| 102 |
+
"architecture": "Hopper",
|
| 103 |
+
"uuid": "GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde"
|
| 104 |
+
},
|
| 105 |
+
{
|
| 106 |
+
"name": "NVIDIA H20",
|
| 107 |
+
"memoryTotal": "102625181696",
|
| 108 |
+
"cudaCores": 9984,
|
| 109 |
+
"architecture": "Hopper",
|
| 110 |
+
"uuid": "GPU-4fa493fc-c408-182f-138e-bcc15c7f9138"
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "NVIDIA H20",
|
| 114 |
+
"memoryTotal": "102625181696",
|
| 115 |
+
"cudaCores": 9984,
|
| 116 |
+
"architecture": "Hopper",
|
| 117 |
+
"uuid": "GPU-16ef9185-6132-8620-ad2e-1f8920ded508"
|
| 118 |
+
}
|
| 119 |
+
],
|
| 120 |
+
"cudaVersion": "12.4",
|
| 121 |
+
"writerId": "qsdugxujhb6s3j19wae2dfqwajsgmsw2"
|
| 122 |
+
}
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"model_time":1.0015201809583232,"_wandb":{"runtime":115102},"data_time":0.002643669955432415,"epoch":0.85,"_step":100000,"_runtime":115102.355367037,"learning_rate":5e-07,"_timestamp":1.76875927504325e+09,"mse_score":0.007693730294704437,"action_dit_loss":0.05095190927386284}
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-17T18:03:45.356692165+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-17T18:03:48.552330417+08:00","level":"INFO","msg":"stream: created new stream","id":"xbap43rk"}
|
| 3 |
+
{"time":"2026-01-17T18:03:48.552524112+08:00","level":"INFO","msg":"handler: started","stream_id":"xbap43rk"}
|
| 4 |
+
{"time":"2026-01-17T18:03:48.577796615+08:00","level":"INFO","msg":"stream: started","id":"xbap43rk"}
|
| 5 |
+
{"time":"2026-01-17T18:03:48.577817586+08:00","level":"INFO","msg":"writer: started","stream_id":"xbap43rk"}
|
| 6 |
+
{"time":"2026-01-17T18:03:48.577832655+08:00","level":"INFO","msg":"sender: started","stream_id":"xbap43rk"}
|
| 7 |
+
{"time":"2026-01-17T20:02:17.852359064+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 8 |
+
{"time":"2026-01-17T20:04:33.007831623+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 9 |
+
{"time":"2026-01-17T20:35:32.863685268+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 10 |
+
{"time":"2026-01-17T22:03:46.318542143+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 11 |
+
{"time":"2026-01-17T22:48:34.635180932+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 12 |
+
{"time":"2026-01-17T22:55:57.518503703+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 13 |
+
{"time":"2026-01-17T23:07:48.293218261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 14 |
+
{"time":"2026-01-17T23:08:32.231325893+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-17T23:12:50.87203047+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 16 |
+
{"time":"2026-01-17T23:13:18.698788758+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": http2: client conn is closed"}
|
| 17 |
+
{"time":"2026-01-17T23:16:49.881636821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-01-17T23:25:00.472362504+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-01-18T00:16:02.236615436+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-01-18T00:33:00.268425846+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 21 |
+
{"time":"2026-01-18T00:33:13.186386827+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 22 |
+
{"time":"2026-01-18T02:52:45.26127457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 23 |
+
{"time":"2026-01-18T02:53:30.366178096+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 24 |
+
{"time":"2026-01-18T04:54:45.36780745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 25 |
+
{"time":"2026-01-18T04:55:30.238642915+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 26 |
+
{"time":"2026-01-18T04:55:42.722661208+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 27 |
+
{"time":"2026-01-18T04:56:15.382797183+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 28 |
+
{"time":"2026-01-18T08:43:45.342343851+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 29 |
+
{"time":"2026-01-18T08:44:00.358330288+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 30 |
+
{"time":"2026-01-18T08:44:30.251461638+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 31 |
+
{"time":"2026-01-18T10:47:45.345590419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 32 |
+
{"time":"2026-01-18T12:47:15.286316861+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 33 |
+
{"time":"2026-01-18T13:40:46.383240786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 34 |
+
{"time":"2026-01-18T16:22:00.269227917+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 35 |
+
{"time":"2026-01-18T16:23:00.259212087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 36 |
+
{"time":"2026-01-18T16:26:15.279544821+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 37 |
+
{"time":"2026-01-18T16:28:15.394951264+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 38 |
+
{"time":"2026-01-18T16:28:28.376139107+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 39 |
+
{"time":"2026-01-18T16:32:34.771745298+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 40 |
+
{"time":"2026-01-18T16:32:50.854108579+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 41 |
+
{"time":"2026-01-18T16:33:15.253909146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 42 |
+
{"time":"2026-01-18T16:33:30.268871735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 43 |
+
{"time":"2026-01-18T16:33:45.254149217+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 44 |
+
{"time":"2026-01-18T16:33:57.84608755+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 45 |
+
{"time":"2026-01-18T16:34:14.118425621+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 46 |
+
{"time":"2026-01-18T16:34:26.791643445+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 47 |
+
{"time":"2026-01-18T16:35:30.392649391+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 48 |
+
{"time":"2026-01-18T16:35:45.390391138+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 49 |
+
{"time":"2026-01-18T16:37:00.231753869+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 50 |
+
{"time":"2026-01-18T16:39:00.308923433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 51 |
+
{"time":"2026-01-18T16:50:44.109993399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 52 |
+
{"time":"2026-01-18T16:56:44.222721195+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 53 |
+
{"time":"2026-01-18T16:56:59.182350472+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 54 |
+
{"time":"2026-01-18T16:57:12.200012616+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 55 |
+
{"time":"2026-01-18T16:57:30.278294605+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 56 |
+
{"time":"2026-01-18T16:57:45.272613563+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 57 |
+
{"time":"2026-01-18T16:57:58.361466419+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 58 |
+
{"time":"2026-01-18T16:58:16.374502713+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 59 |
+
{"time":"2026-01-18T17:01:49.770643385+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 60 |
+
{"time":"2026-01-18T17:03:00.288457229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 61 |
+
{"time":"2026-01-18T17:03:45.353334974+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 62 |
+
{"time":"2026-01-18T18:17:45.365055726+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 63 |
+
{"time":"2026-01-18T18:24:00.357867283+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 64 |
+
{"time":"2026-01-18T19:06:15.375047877+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 65 |
+
{"time":"2026-01-18T19:06:28.413756607+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 66 |
+
{"time":"2026-01-18T19:15:30.232002999+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 67 |
+
{"time":"2026-01-18T19:39:30.251864251+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 68 |
+
{"time":"2026-01-18T19:40:00.288831216+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 69 |
+
{"time":"2026-01-18T19:52:30.252619907+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 70 |
+
{"time":"2026-01-18T20:51:49.773485296+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 71 |
+
{"time":"2026-01-18T21:32:54.188737252+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 72 |
+
{"time":"2026-01-18T22:14:31.789385651+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": unexpected EOF"}
|
| 73 |
+
{"time":"2026-01-19T00:11:15.393839366+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 74 |
+
{"time":"2026-01-19T00:50:30.380524837+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 75 |
+
{"time":"2026-01-19T00:51:00.395000654+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 76 |
+
{"time":"2026-01-19T00:51:13.162530742+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 77 |
+
{"time":"2026-01-19T00:54:30.249839041+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 78 |
+
{"time":"2026-01-19T00:55:30.349433303+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 79 |
+
{"time":"2026-01-19T01:00:31.333972122+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 80 |
+
{"time":"2026-01-19T01:19:30.367251508+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 81 |
+
{"time":"2026-01-19T01:20:30.296201955+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 82 |
+
{"time":"2026-01-19T01:51:00.221611746+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 83 |
+
{"time":"2026-01-19T01:52:30.445846213+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_GR00T/xbap43rk/file_stream\": EOF"}
|
| 84 |
+
{"time":"2026-01-19T02:02:15.651403576+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 85 |
+
{"time":"2026-01-19T02:02:17.343084437+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
|
| 86 |
+
{"time":"2026-01-19T02:02:17.352284781+08:00","level":"INFO","msg":"stream: closing","id":"xbap43rk"}
|
| 87 |
+
{"time":"2026-01-19T02:02:17.35229661+08:00","level":"INFO","msg":"handler: closed","stream_id":"xbap43rk"}
|
| 88 |
+
{"time":"2026-01-19T02:02:17.384196864+08:00","level":"INFO","msg":"sender: closed","stream_id":"xbap43rk"}
|
| 89 |
+
{"time":"2026-01-19T02:02:17.384209276+08:00","level":"INFO","msg":"stream: closed","id":"xbap43rk"}
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/logs/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenGR00T_0117_1747/wandb/wandb/run-20260117_180339-xbap43rk/run-xbap43rk.wandb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7eb50f80f1190a86e2744977be0372f4150f63c16e050177b613fb7d1e84338
|
| 3 |
+
size 110227380
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/config.yaml
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
datasets:
|
| 2 |
+
vla_data:
|
| 3 |
+
CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
|
| 4 |
+
Locate their bounding boxes in [x1,y1,x2,y2] format.
|
| 5 |
+
data_mix: bridge_rt_1
|
| 6 |
+
data_root_dir: ./playground/Datasets/OXE_LEROBOT
|
| 7 |
+
dataset_py: lerobot_datasets
|
| 8 |
+
image_size:
|
| 9 |
+
- 224
|
| 10 |
+
- 224
|
| 11 |
+
per_device_batch_size: 8
|
| 12 |
+
video_backend: torchvision_av
|
| 13 |
+
framework:
|
| 14 |
+
action_model:
|
| 15 |
+
action_dim: 7
|
| 16 |
+
action_hidden_dim: 4096
|
| 17 |
+
action_model_type: DiT-B
|
| 18 |
+
future_action_window_size: 15
|
| 19 |
+
past_action_window_size: 0
|
| 20 |
+
name: QwenOFT
|
| 21 |
+
qwenvl:
|
| 22 |
+
base_vlm: /home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
|
| 23 |
+
output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323
|
| 24 |
+
run_id: qwen3vl_bridge_rt1_QwenOFT_0112_1323
|
| 25 |
+
run_root_dir: ./Checkpoints
|
| 26 |
+
seed: 42
|
| 27 |
+
trainer:
|
| 28 |
+
eval_interval: 200
|
| 29 |
+
freeze_modules: true
|
| 30 |
+
gradient_accumulation_steps: 1
|
| 31 |
+
gradient_clipping: 1.0
|
| 32 |
+
is_resume: false
|
| 33 |
+
learning_rate:
|
| 34 |
+
action_model: 0.0001
|
| 35 |
+
base: 1.0e-05
|
| 36 |
+
qwen_vl_interface: 1.0e-05
|
| 37 |
+
logging_frequency: 50
|
| 38 |
+
lr_scheduler_type: cosine_with_min_lr
|
| 39 |
+
max_train_steps: 100000
|
| 40 |
+
num_warmup_steps: 10000
|
| 41 |
+
optimizer:
|
| 42 |
+
betas:
|
| 43 |
+
- 0.9
|
| 44 |
+
- 0.95
|
| 45 |
+
eps: 1.0e-08
|
| 46 |
+
weight_decay: 1.0e-08
|
| 47 |
+
save_interval: 10000
|
| 48 |
+
scheduler_specific_kwargs:
|
| 49 |
+
min_lr: 5.0e-07
|
| 50 |
+
wandb_entity: lookas
|
| 51 |
+
wandb_project: Qwen3VL_Bridge_RT1_OFT
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/dataset_statistics.json
ADDED
|
@@ -0,0 +1,264 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"oxe_bridge": {
|
| 3 |
+
"action": {
|
| 4 |
+
"mean": [
|
| 5 |
+
0.00011365935642970726,
|
| 6 |
+
6.556110747624189e-05,
|
| 7 |
+
-6.320965621853247e-05,
|
| 8 |
+
-7.205353176686913e-05,
|
| 9 |
+
-0.00019515302847139537,
|
| 10 |
+
0.0001203166029881686,
|
| 11 |
+
0.28829458355903625
|
| 12 |
+
],
|
| 13 |
+
"std": [
|
| 14 |
+
0.006909770731857718,
|
| 15 |
+
0.009684093232852218,
|
| 16 |
+
0.00896290498528129,
|
| 17 |
+
0.020121052930683073,
|
| 18 |
+
0.021582655517295487,
|
| 19 |
+
0.054723342223346974,
|
| 20 |
+
0.4543627821514982
|
| 21 |
+
],
|
| 22 |
+
"max": [
|
| 23 |
+
0.41691166162490845,
|
| 24 |
+
0.25864794850349426,
|
| 25 |
+
0.21218234300613403,
|
| 26 |
+
3.122201919555664,
|
| 27 |
+
1.8618112802505493,
|
| 28 |
+
6.272472858428955,
|
| 29 |
+
1.0
|
| 30 |
+
],
|
| 31 |
+
"min": [
|
| 32 |
+
-0.4007510244846344,
|
| 33 |
+
-0.13874775171279907,
|
| 34 |
+
-0.22553899884223938,
|
| 35 |
+
-3.2010786533355713,
|
| 36 |
+
-1.8618112802505493,
|
| 37 |
+
-6.279075622558594,
|
| 38 |
+
0.0
|
| 39 |
+
],
|
| 40 |
+
"q01": [
|
| 41 |
+
-0.02875255048274994,
|
| 42 |
+
-0.04170213546603918,
|
| 43 |
+
-0.026096721179783344,
|
| 44 |
+
-0.08052874729037285,
|
| 45 |
+
-0.09249906800687313,
|
| 46 |
+
-0.20738555490970612,
|
| 47 |
+
0.0
|
| 48 |
+
],
|
| 49 |
+
"q99": [
|
| 50 |
+
0.028306663036346436,
|
| 51 |
+
0.04089853074401617,
|
| 52 |
+
0.0401805154979229,
|
| 53 |
+
0.08173403143882751,
|
| 54 |
+
0.07760760560631752,
|
| 55 |
+
0.2038465365767479,
|
| 56 |
+
1.0
|
| 57 |
+
],
|
| 58 |
+
"mask": [
|
| 59 |
+
true,
|
| 60 |
+
true,
|
| 61 |
+
true,
|
| 62 |
+
true,
|
| 63 |
+
true,
|
| 64 |
+
true,
|
| 65 |
+
false
|
| 66 |
+
]
|
| 67 |
+
},
|
| 68 |
+
"state": {
|
| 69 |
+
"mean": [
|
| 70 |
+
0.15471743047237396,
|
| 71 |
+
0.015362550504505634,
|
| 72 |
+
0.03222028166055679,
|
| 73 |
+
0.0032453201711177826,
|
| 74 |
+
-0.038600146770477295,
|
| 75 |
+
0.05382946878671646,
|
| 76 |
+
0.0,
|
| 77 |
+
0.35406652092933655
|
| 78 |
+
],
|
| 79 |
+
"std": [
|
| 80 |
+
0.1605359274864927,
|
| 81 |
+
0.06677912092232112,
|
| 82 |
+
0.048657150951527554,
|
| 83 |
+
0.09275336958940797,
|
| 84 |
+
0.12566984746914736,
|
| 85 |
+
0.41222738578801793,
|
| 86 |
+
0.0,
|
| 87 |
+
0.4330223535305803
|
| 88 |
+
],
|
| 89 |
+
"max": [
|
| 90 |
+
0.5862360596656799,
|
| 91 |
+
0.4034728705883026,
|
| 92 |
+
0.3568263053894043,
|
| 93 |
+
1.3517684936523438,
|
| 94 |
+
1.570796251296997,
|
| 95 |
+
3.141204357147217,
|
| 96 |
+
0.0,
|
| 97 |
+
1.1121242046356201
|
| 98 |
+
],
|
| 99 |
+
"min": [
|
| 100 |
+
-0.04167502000927925,
|
| 101 |
+
-0.3563207685947418,
|
| 102 |
+
-0.15537554025650024,
|
| 103 |
+
-3.141592502593994,
|
| 104 |
+
-1.4992541074752808,
|
| 105 |
+
-3.14153790473938,
|
| 106 |
+
0.0,
|
| 107 |
+
0.04637829214334488
|
| 108 |
+
],
|
| 109 |
+
"q01": [
|
| 110 |
+
0.17102622985839844,
|
| 111 |
+
-0.1698118858039379,
|
| 112 |
+
-0.055632163770496845,
|
| 113 |
+
-0.36493172496557236,
|
| 114 |
+
-0.541871190071106,
|
| 115 |
+
-1.354275494813919,
|
| 116 |
+
0.0,
|
| 117 |
+
0.052190229296684265
|
| 118 |
+
],
|
| 119 |
+
"q99": [
|
| 120 |
+
0.45322076976299286,
|
| 121 |
+
0.2354845181107521,
|
| 122 |
+
0.19489620998501778,
|
| 123 |
+
0.3780156075954437,
|
| 124 |
+
0.27568644285202026,
|
| 125 |
+
1.8500566184520721,
|
| 126 |
+
0.0,
|
| 127 |
+
1.0105689764022827
|
| 128 |
+
]
|
| 129 |
+
},
|
| 130 |
+
"num_transitions": 1305714,
|
| 131 |
+
"num_trajectories": 53192
|
| 132 |
+
},
|
| 133 |
+
"oxe_rt1": {
|
| 134 |
+
"action": {
|
| 135 |
+
"mean": [
|
| 136 |
+
0.003493750700727105,
|
| 137 |
+
0.003132961690425873,
|
| 138 |
+
-0.0063125672750175,
|
| 139 |
+
0.02166595682501793,
|
| 140 |
+
-0.0028780836146324873,
|
| 141 |
+
0.0004565489653032273,
|
| 142 |
+
0.26771023869514465
|
| 143 |
+
],
|
| 144 |
+
"std": [
|
| 145 |
+
0.049065014465362655,
|
| 146 |
+
0.04229853739828572,
|
| 147 |
+
0.05237628880142378,
|
| 148 |
+
0.1124860236500875,
|
| 149 |
+
0.09312952783816872,
|
| 150 |
+
0.10319098309601091,
|
| 151 |
+
0.4418448662622395
|
| 152 |
+
],
|
| 153 |
+
"max": [
|
| 154 |
+
2.9984593391418457,
|
| 155 |
+
22.09052848815918,
|
| 156 |
+
2.7507524490356445,
|
| 157 |
+
1.570636510848999,
|
| 158 |
+
1.5321086645126343,
|
| 159 |
+
1.5691522359848022,
|
| 160 |
+
1.0
|
| 161 |
+
],
|
| 162 |
+
"min": [
|
| 163 |
+
-2.0204520225524902,
|
| 164 |
+
-5.497899532318115,
|
| 165 |
+
-2.031663417816162,
|
| 166 |
+
-1.569917917251587,
|
| 167 |
+
-1.569892168045044,
|
| 168 |
+
-1.570419430732727,
|
| 169 |
+
0.0
|
| 170 |
+
],
|
| 171 |
+
"q01": [
|
| 172 |
+
-0.22453527510166169,
|
| 173 |
+
-0.14820013284683228,
|
| 174 |
+
-0.231589707583189,
|
| 175 |
+
-0.3517994859814644,
|
| 176 |
+
-0.4193011274933815,
|
| 177 |
+
-0.43643461108207704,
|
| 178 |
+
0.0
|
| 179 |
+
],
|
| 180 |
+
"q99": [
|
| 181 |
+
0.17824687153100965,
|
| 182 |
+
0.14938379630446405,
|
| 183 |
+
0.21842354819178575,
|
| 184 |
+
0.5892666035890578,
|
| 185 |
+
0.35272657424211445,
|
| 186 |
+
0.44796681255102094,
|
| 187 |
+
1.0
|
| 188 |
+
],
|
| 189 |
+
"mask": [
|
| 190 |
+
true,
|
| 191 |
+
true,
|
| 192 |
+
true,
|
| 193 |
+
true,
|
| 194 |
+
true,
|
| 195 |
+
true,
|
| 196 |
+
false
|
| 197 |
+
]
|
| 198 |
+
},
|
| 199 |
+
"state": {
|
| 200 |
+
"mean": [
|
| 201 |
+
0.2799473702907562,
|
| 202 |
+
-0.04167069122195244,
|
| 203 |
+
0.38854750990867615,
|
| 204 |
+
0.21306729316711426,
|
| 205 |
+
-0.12402277439832687,
|
| 206 |
+
0.24756911396980286,
|
| 207 |
+
0.046330634504556656,
|
| 208 |
+
0.10487449914216995
|
| 209 |
+
],
|
| 210 |
+
"std": [
|
| 211 |
+
0.29342642876909925,
|
| 212 |
+
0.09174024655686211,
|
| 213 |
+
0.42569508885539115,
|
| 214 |
+
0.38616252611341306,
|
| 215 |
+
0.38314586427420927,
|
| 216 |
+
0.44433568806919804,
|
| 217 |
+
0.1263927443679382,
|
| 218 |
+
0.22122596673781084
|
| 219 |
+
],
|
| 220 |
+
"max": [
|
| 221 |
+
1.0534898042678833,
|
| 222 |
+
0.48018959164619446,
|
| 223 |
+
1.6896663904190063,
|
| 224 |
+
1.0,
|
| 225 |
+
0.9999993443489075,
|
| 226 |
+
0.9999874830245972,
|
| 227 |
+
0.9554369449615479,
|
| 228 |
+
0.9914546012878418
|
| 229 |
+
],
|
| 230 |
+
"min": [
|
| 231 |
+
-0.4436439275741577,
|
| 232 |
+
-0.9970501065254211,
|
| 233 |
+
-0.006579156965017319,
|
| 234 |
+
0.0,
|
| 235 |
+
-0.8643477559089661,
|
| 236 |
+
-0.7079970240592957,
|
| 237 |
+
-0.7688722014427185,
|
| 238 |
+
-0.4999994933605194
|
| 239 |
+
],
|
| 240 |
+
"q01": [
|
| 241 |
+
0.32481380939483645,
|
| 242 |
+
-0.28334290891885755,
|
| 243 |
+
0.14107070609927178,
|
| 244 |
+
0.0,
|
| 245 |
+
-0.686474204659462,
|
| 246 |
+
-0.6808923494815826,
|
| 247 |
+
-0.36045596331357954,
|
| 248 |
+
-0.454380963742733
|
| 249 |
+
],
|
| 250 |
+
"q99": [
|
| 251 |
+
0.8750156319141384,
|
| 252 |
+
0.21247054174542404,
|
| 253 |
+
1.0727112340927123,
|
| 254 |
+
1.0,
|
| 255 |
+
0.9377871316671368,
|
| 256 |
+
0.9563051050901409,
|
| 257 |
+
0.45990042358636823,
|
| 258 |
+
0.7216041100025177
|
| 259 |
+
]
|
| 260 |
+
},
|
| 261 |
+
"num_transitions": 3786152,
|
| 262 |
+
"num_trajectories": 87212
|
| 263 |
+
}
|
| 264 |
+
}
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/run_qwen3vl_bridge_rt1_qwen_oft.sh
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Framework_name=QwenOFT
|
| 2 |
+
dit_type="DiT-B"
|
| 3 |
+
freeze_module_list='' # fully FT, e.g., freeze_module_list=""
|
| 4 |
+
data_mix=bridge_rt_1
|
| 5 |
+
|
| 6 |
+
## Modify below paths before running ##
|
| 7 |
+
date_time=$(date +%m%d_%H%M)
|
| 8 |
+
config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
|
| 9 |
+
base_vlm=/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
|
| 10 |
+
data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
|
| 11 |
+
run_root_dir=./Checkpoints
|
| 12 |
+
run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
|
| 13 |
+
batch_size=8
|
| 14 |
+
wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
|
| 15 |
+
wandb_entity=lookas
|
| 16 |
+
|
| 17 |
+
# export WANDB_MODE=disabled
|
| 18 |
+
|
| 19 |
+
output_dir=${run_root_dir}/${run_id}
|
| 20 |
+
mkdir -p ${output_dir}
|
| 21 |
+
cp $0 ${output_dir}/
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
accelerate launch --main_process_port 12773 \
|
| 25 |
+
--config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 26 |
+
--num_processes 8 \
|
| 27 |
+
starVLA/training/train_starvla.py \
|
| 28 |
+
--config_yaml ${config_yaml} \
|
| 29 |
+
--framework.name ${Framework_name} \
|
| 30 |
+
--framework.qwenvl.base_vlm ${base_vlm} \
|
| 31 |
+
--datasets.vla_data.data_root_dir ${data_root_dir}\
|
| 32 |
+
--datasets.vla_data.data_mix ${data_mix} \
|
| 33 |
+
--datasets.vla_data.per_device_batch_size ${batch_size} \
|
| 34 |
+
--trainer.freeze_modules ${freeze_module_list} \
|
| 35 |
+
--trainer.max_train_steps 100000 \
|
| 36 |
+
--trainer.save_interval 10000 \
|
| 37 |
+
--trainer.logging_frequency 50 \
|
| 38 |
+
--trainer.eval_interval 200 \
|
| 39 |
+
--run_root_dir ${run_root_dir} \
|
| 40 |
+
--run_id ${run_id} \
|
| 41 |
+
--output_dir ${output_dir} \
|
| 42 |
+
--wandb.project ${wandb_project} \
|
| 43 |
+
--wandb.entity ${wandb_entity}
|
| 44 |
+
|
| 45 |
+
|
| 46 |
+
# multi-node launch example
|
| 47 |
+
|
| 48 |
+
# accelerate launch \
|
| 49 |
+
# --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 50 |
+
# --main_process_ip $MASTER_ADDR \
|
| 51 |
+
# --main_process_port $MASTER_PORT \
|
| 52 |
+
# --machine_rank $SLURM_PROCID \
|
| 53 |
+
# --num_machines $SLURM_NNODES \
|
| 54 |
+
# --num_processes=${TOTAL_GPUS} \
|
| 55 |
+
# starVLA/training/train_starvla.py \
|
| 56 |
+
# --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
|
| 57 |
+
# --framework.framework_py QwenGR00T \
|
| 58 |
+
# --framework.qwenvl.base_vlm microsoft/Florence-2-large \
|
| 59 |
+
# --run_root_dir ${run_root_dir} \
|
| 60 |
+
# --run_id ${run_id} \
|
| 61 |
+
# --wandb_project your_project \
|
| 62 |
+
# --wandb_entity your_name
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/summary.jsonl
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"steps": 10000}
|
| 2 |
+
{"steps": 20000}
|
| 3 |
+
{"steps": 30000}
|
| 4 |
+
{"steps": 40000}
|
| 5 |
+
{"steps": 50000}
|
| 6 |
+
{"steps": 60000}
|
| 7 |
+
{"steps": 70000}
|
| 8 |
+
{"steps": 80000}
|
| 9 |
+
{"steps": 90000}
|
| 10 |
+
{"steps": 100000}
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug-internal.log
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-12T13:33:02.374820947+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-12T13:33:03.82154982+08:00","level":"INFO","msg":"stream: created new stream","id":"ueywjhk5"}
|
| 3 |
+
{"time":"2026-01-12T13:33:03.821725323+08:00","level":"INFO","msg":"handler: started","stream_id":"ueywjhk5"}
|
| 4 |
+
{"time":"2026-01-12T13:33:03.846752186+08:00","level":"INFO","msg":"stream: started","id":"ueywjhk5"}
|
| 5 |
+
{"time":"2026-01-12T13:33:03.846770681+08:00","level":"INFO","msg":"writer: started","stream_id":"ueywjhk5"}
|
| 6 |
+
{"time":"2026-01-12T13:33:03.846770288+08:00","level":"INFO","msg":"sender: started","stream_id":"ueywjhk5"}
|
| 7 |
+
{"time":"2026-01-12T14:18:31.589248229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 8 |
+
{"time":"2026-01-12T14:39:00.33374833+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 9 |
+
{"time":"2026-01-12T14:45:00.196854395+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 10 |
+
{"time":"2026-01-12T15:30:49.608798424+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": net/http: request canceled while waiting for connection (Client.Timeout exceeded while awaiting headers)"}
|
| 11 |
+
{"time":"2026-01-12T15:58:15.168936649+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 12 |
+
{"time":"2026-01-12T16:32:15.169856477+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 13 |
+
{"time":"2026-01-12T16:32:28.120660769+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 14 |
+
{"time":"2026-01-12T18:52:15.110123119+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-12T20:25:15.093766297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 16 |
+
{"time":"2026-01-12T20:46:29.622105415+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": Gateway Timeout"}
|
| 17 |
+
{"time":"2026-01-12T20:57:51.676789447+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-01-12T21:34:03.873286543+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-01-12T21:57:16.546518785+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-01-12T22:29:15.864952943+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 21 |
+
{"time":"2026-01-12T22:36:13.618868987+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 22 |
+
{"time":"2026-01-12T22:36:31.272703076+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 23 |
+
{"time":"2026-01-13T00:17:45.174009838+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 24 |
+
{"time":"2026-01-13T00:17:57.789671331+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 25 |
+
{"time":"2026-01-13T00:18:45.160525879+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 26 |
+
{"time":"2026-01-13T01:22:18.006447633+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 27 |
+
{"time":"2026-01-13T02:03:21.340298852+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 28 |
+
{"time":"2026-01-13T03:04:34.668877357+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 29 |
+
{"time":"2026-01-13T03:04:47.661210297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 30 |
+
{"time":"2026-01-13T03:12:30.235091077+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 31 |
+
{"time":"2026-01-13T03:13:15.087092941+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 32 |
+
{"time":"2026-01-13T05:33:30.27306441+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 33 |
+
{"time":"2026-01-13T05:33:45.195585087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 34 |
+
{"time":"2026-01-13T05:34:15.047256192+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 35 |
+
{"time":"2026-01-13T06:34:30.165692234+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 36 |
+
{"time":"2026-01-13T06:34:42.845804108+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 37 |
+
{"time":"2026-01-13T06:34:59.430634519+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 38 |
+
{"time":"2026-01-13T06:35:45.090534347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 39 |
+
{"time":"2026-01-13T06:38:45.24671956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 40 |
+
{"time":"2026-01-13T06:40:00.085760676+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 41 |
+
{"time":"2026-01-13T06:40:30.253594276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 42 |
+
{"time":"2026-01-13T06:40:45.119737819+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 43 |
+
{"time":"2026-01-13T06:41:01.006178451+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 44 |
+
{"time":"2026-01-13T09:01:01.259781836+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 45 |
+
{"time":"2026-01-13T10:20:27.160154786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 46 |
+
{"time":"2026-01-13T11:23:00.198050425+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 47 |
+
{"time":"2026-01-13T11:24:00.137963825+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 48 |
+
{"time":"2026-01-13T11:41:16.643086394+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 49 |
+
{"time":"2026-01-13T12:21:36.803454674+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 50 |
+
{"time":"2026-01-13T12:29:23.122571501+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 51 |
+
{"time":"2026-01-13T12:59:15.208303261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 52 |
+
{"time":"2026-01-13T13:06:15.210877761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 53 |
+
{"time":"2026-01-13T13:06:27.856833979+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 54 |
+
{"time":"2026-01-13T13:09:06.355015154+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 55 |
+
{"time":"2026-01-13T13:40:00.126142378+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 56 |
+
{"time":"2026-01-13T13:46:32.168389695+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 57 |
+
{"time":"2026-01-13T13:48:15.081349554+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 58 |
+
{"time":"2026-01-13T13:57:00.197403381+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 59 |
+
{"time":"2026-01-13T15:57:25.317460174+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 60 |
+
{"time":"2026-01-13T15:59:46.726236225+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 61 |
+
{"time":"2026-01-13T16:09:46.448847236+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 62 |
+
{"time":"2026-01-13T16:58:01.095875797+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 63 |
+
{"time":"2026-01-13T17:24:10.021730043+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 64 |
+
{"time":"2026-01-13T18:27:15.075407399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 65 |
+
{"time":"2026-01-13T18:36:00.080917996+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 66 |
+
{"time":"2026-01-13T18:36:30.217018153+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 67 |
+
{"time":"2026-01-13T18:38:00.137187254+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 68 |
+
{"time":"2026-01-13T18:54:07.673379631+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 69 |
+
{"time":"2026-01-13T19:07:00.253334334+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 70 |
+
{"time":"2026-01-13T19:15:30.09514757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 71 |
+
{"time":"2026-01-13T20:25:51.505745758+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 72 |
+
{"time":"2026-01-13T21:59:51.560168548+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 73 |
+
{"time":"2026-01-13T23:25:27.580587803+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 74 |
+
{"time":"2026-01-13T23:25:28.86707285+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
|
| 75 |
+
{"time":"2026-01-13T23:25:28.876898999+08:00","level":"INFO","msg":"stream: closing","id":"ueywjhk5"}
|
| 76 |
+
{"time":"2026-01-13T23:25:28.876914442+08:00","level":"INFO","msg":"handler: closed","stream_id":"ueywjhk5"}
|
| 77 |
+
{"time":"2026-01-13T23:25:28.90868024+08:00","level":"INFO","msg":"sender: closed","stream_id":"ueywjhk5"}
|
| 78 |
+
{"time":"2026-01-13T23:25:28.90870897+08:00","level":"INFO","msg":"stream: closed","id":"ueywjhk5"}
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/config.yaml
ADDED
|
@@ -0,0 +1,133 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_wandb:
|
| 2 |
+
value:
|
| 3 |
+
cli_version: 0.23.1
|
| 4 |
+
e:
|
| 5 |
+
3h4xzexd9mhzcjwlbp7j0zfzyqq963et:
|
| 6 |
+
args:
|
| 7 |
+
- --config_yaml
|
| 8 |
+
- scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
|
| 9 |
+
- --framework.name
|
| 10 |
+
- QwenOFT
|
| 11 |
+
- --framework.qwenvl.base_vlm
|
| 12 |
+
- /home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b
|
| 13 |
+
- --datasets.vla_data.data_root_dir
|
| 14 |
+
- ./playground/Datasets/OXE_LEROBOT
|
| 15 |
+
- --datasets.vla_data.data_mix
|
| 16 |
+
- bridge_rt_1
|
| 17 |
+
- --datasets.vla_data.per_device_batch_size
|
| 18 |
+
- "8"
|
| 19 |
+
- --trainer.freeze_modules
|
| 20 |
+
- --trainer.max_train_steps
|
| 21 |
+
- "100000"
|
| 22 |
+
- --trainer.save_interval
|
| 23 |
+
- "10000"
|
| 24 |
+
- --trainer.logging_frequency
|
| 25 |
+
- "50"
|
| 26 |
+
- --trainer.eval_interval
|
| 27 |
+
- "200"
|
| 28 |
+
- --run_root_dir
|
| 29 |
+
- ./Checkpoints
|
| 30 |
+
- --run_id
|
| 31 |
+
- qwen3vl_bridge_rt1_QwenOFT_0112_1323
|
| 32 |
+
- --output_dir
|
| 33 |
+
- ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323
|
| 34 |
+
- --wandb.project
|
| 35 |
+
- Qwen3VL_Bridge_RT1_QwenOFT
|
| 36 |
+
- --wandb.entity
|
| 37 |
+
- lookas
|
| 38 |
+
codePath: starVLA/training/train_starvla.py
|
| 39 |
+
codePathLocal: starVLA/training/train_starvla.py
|
| 40 |
+
cpu_count: 90
|
| 41 |
+
cpu_count_logical: 180
|
| 42 |
+
cudaVersion: "12.4"
|
| 43 |
+
disk:
|
| 44 |
+
/:
|
| 45 |
+
total: "3779301580800"
|
| 46 |
+
used: "159098298368"
|
| 47 |
+
email: hilookas@gmail.com
|
| 48 |
+
executable: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3
|
| 49 |
+
git:
|
| 50 |
+
commit: ab531aff5b27795879c61f67892330a616e9dbf0
|
| 51 |
+
remote: https://github.com/hilookas/starVLA_pickxiguapi
|
| 52 |
+
gpu: NVIDIA H20
|
| 53 |
+
gpu_count: 8
|
| 54 |
+
gpu_nvidia:
|
| 55 |
+
- architecture: Hopper
|
| 56 |
+
cudaCores: 9984
|
| 57 |
+
memoryTotal: "102625181696"
|
| 58 |
+
name: NVIDIA H20
|
| 59 |
+
uuid: GPU-f99bae5f-ffca-4972-6420-64c42ba64f22
|
| 60 |
+
- architecture: Hopper
|
| 61 |
+
cudaCores: 9984
|
| 62 |
+
memoryTotal: "102625181696"
|
| 63 |
+
name: NVIDIA H20
|
| 64 |
+
uuid: GPU-a00709c9-6bdf-4011-64dc-95421da94ba4
|
| 65 |
+
- architecture: Hopper
|
| 66 |
+
cudaCores: 9984
|
| 67 |
+
memoryTotal: "102625181696"
|
| 68 |
+
name: NVIDIA H20
|
| 69 |
+
uuid: GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5
|
| 70 |
+
- architecture: Hopper
|
| 71 |
+
cudaCores: 9984
|
| 72 |
+
memoryTotal: "102625181696"
|
| 73 |
+
name: NVIDIA H20
|
| 74 |
+
uuid: GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9
|
| 75 |
+
- architecture: Hopper
|
| 76 |
+
cudaCores: 9984
|
| 77 |
+
memoryTotal: "102625181696"
|
| 78 |
+
name: NVIDIA H20
|
| 79 |
+
uuid: GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218
|
| 80 |
+
- architecture: Hopper
|
| 81 |
+
cudaCores: 9984
|
| 82 |
+
memoryTotal: "102625181696"
|
| 83 |
+
name: NVIDIA H20
|
| 84 |
+
uuid: GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde
|
| 85 |
+
- architecture: Hopper
|
| 86 |
+
cudaCores: 9984
|
| 87 |
+
memoryTotal: "102625181696"
|
| 88 |
+
name: NVIDIA H20
|
| 89 |
+
uuid: GPU-4fa493fc-c408-182f-138e-bcc15c7f9138
|
| 90 |
+
- architecture: Hopper
|
| 91 |
+
cudaCores: 9984
|
| 92 |
+
memoryTotal: "102625181696"
|
| 93 |
+
name: NVIDIA H20
|
| 94 |
+
uuid: GPU-16ef9185-6132-8620-ad2e-1f8920ded508
|
| 95 |
+
host: g340-cd51-7700-770-343f-3fec-69bb
|
| 96 |
+
memory:
|
| 97 |
+
total: "2071188119552"
|
| 98 |
+
os: Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36
|
| 99 |
+
program: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py
|
| 100 |
+
python: CPython 3.10.19
|
| 101 |
+
root: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb
|
| 102 |
+
startedAt: "2026-01-12T05:32:56.070975Z"
|
| 103 |
+
writerId: 3h4xzexd9mhzcjwlbp7j0zfzyqq963et
|
| 104 |
+
m: []
|
| 105 |
+
python_version: 3.10.19
|
| 106 |
+
t:
|
| 107 |
+
"1":
|
| 108 |
+
- 1
|
| 109 |
+
- 11
|
| 110 |
+
- 41
|
| 111 |
+
- 49
|
| 112 |
+
- 63
|
| 113 |
+
- 71
|
| 114 |
+
- 80
|
| 115 |
+
- 83
|
| 116 |
+
"2":
|
| 117 |
+
- 1
|
| 118 |
+
- 11
|
| 119 |
+
- 41
|
| 120 |
+
- 49
|
| 121 |
+
- 63
|
| 122 |
+
- 71
|
| 123 |
+
- 80
|
| 124 |
+
- 83
|
| 125 |
+
"3":
|
| 126 |
+
- 2
|
| 127 |
+
- 13
|
| 128 |
+
- 61
|
| 129 |
+
"4": 3.10.19
|
| 130 |
+
"5": 0.23.1
|
| 131 |
+
"6": 4.57.3
|
| 132 |
+
"12": 0.23.1
|
| 133 |
+
"13": linux-x86_64
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/output.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/requirements.txt
ADDED
|
@@ -0,0 +1,190 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
starVLA==1.0.1
|
| 2 |
+
absl-py==2.3.1
|
| 3 |
+
accelerate==1.5.2
|
| 4 |
+
albucore==0.0.17
|
| 5 |
+
albumentations==1.4.18
|
| 6 |
+
annotated-types==0.7.0
|
| 7 |
+
antlr4-python3-runtime==4.9.3
|
| 8 |
+
anyio==4.12.0
|
| 9 |
+
asttokens==3.0.1
|
| 10 |
+
attrs==20.3.0
|
| 11 |
+
av==12.3.0
|
| 12 |
+
bddl==1.0.1
|
| 13 |
+
certifi==2025.11.12
|
| 14 |
+
charset-normalizer==3.4.4
|
| 15 |
+
click==8.3.1
|
| 16 |
+
cloudpickle==3.1.2
|
| 17 |
+
contourpy==1.3.2
|
| 18 |
+
cramjam==2.11.0
|
| 19 |
+
cycler==0.12.1
|
| 20 |
+
debugpy==1.8.19
|
| 21 |
+
decorator==5.2.1
|
| 22 |
+
decord==0.6.0
|
| 23 |
+
deepspeed==0.16.9
|
| 24 |
+
diffusers==0.36.0
|
| 25 |
+
docstring_parser==0.17.0
|
| 26 |
+
easydict==1.9
|
| 27 |
+
einops==0.8.1
|
| 28 |
+
etils==1.13.0
|
| 29 |
+
eva-decord==0.6.1
|
| 30 |
+
eval_type_backport==0.3.1
|
| 31 |
+
exceptiongroup==1.3.1
|
| 32 |
+
executing==2.2.1
|
| 33 |
+
fastjsonschema==2.21.2
|
| 34 |
+
fastparquet==2024.11.0
|
| 35 |
+
filelock==3.20.2
|
| 36 |
+
flash_attn==2.8.3
|
| 37 |
+
fonttools==4.61.1
|
| 38 |
+
fsspec==2025.12.0
|
| 39 |
+
future==0.18.2
|
| 40 |
+
fvcore==0.1.5.post20221221
|
| 41 |
+
gevent==25.9.1
|
| 42 |
+
gitdb==4.0.12
|
| 43 |
+
GitPython==3.1.46
|
| 44 |
+
glfw==2.10.0
|
| 45 |
+
greenlet==3.3.0
|
| 46 |
+
grpcio==1.76.0
|
| 47 |
+
gym==0.26.2
|
| 48 |
+
gym-notices==0.1.0
|
| 49 |
+
h11==0.16.0
|
| 50 |
+
hf-xet==1.2.0
|
| 51 |
+
hjson==3.1.0
|
| 52 |
+
httpcore==1.0.9
|
| 53 |
+
httpx==0.28.1
|
| 54 |
+
huggingface-hub==0.36.0
|
| 55 |
+
idna==3.11
|
| 56 |
+
ImageIO==2.37.2
|
| 57 |
+
importlib_metadata==8.7.1
|
| 58 |
+
importlib_resources==6.5.2
|
| 59 |
+
iniconfig==2.3.0
|
| 60 |
+
iopath==0.1.10
|
| 61 |
+
ipdb==0.13.13
|
| 62 |
+
ipython==8.37.0
|
| 63 |
+
jedi==0.19.2
|
| 64 |
+
Jinja2==3.1.6
|
| 65 |
+
jsonschema==4.17.3
|
| 66 |
+
jupyter_core==5.9.1
|
| 67 |
+
jupytext==1.18.1
|
| 68 |
+
kiwisolver==1.4.9
|
| 69 |
+
lazy_loader==0.4
|
| 70 |
+
libero==0.1.0
|
| 71 |
+
llvmlite==0.46.0
|
| 72 |
+
Markdown==3.10
|
| 73 |
+
markdown-it-py==4.0.0
|
| 74 |
+
MarkupSafe==3.0.3
|
| 75 |
+
matplotlib==3.10.8
|
| 76 |
+
matplotlib-inline==0.2.1
|
| 77 |
+
mdit-py-plugins==0.5.0
|
| 78 |
+
mdurl==0.1.2
|
| 79 |
+
mpmath==1.3.0
|
| 80 |
+
msgpack==1.1.2
|
| 81 |
+
mujoco==3.4.0
|
| 82 |
+
nbformat==5.10.4
|
| 83 |
+
networkx==3.4.2
|
| 84 |
+
ninja==1.13.0
|
| 85 |
+
numba==0.63.1
|
| 86 |
+
numpy==1.26.4
|
| 87 |
+
numpydantic==1.6.9
|
| 88 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 89 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 90 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 91 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 92 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 93 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 94 |
+
nvidia-curand-cu12==10.3.5.147
|
| 95 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 96 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 97 |
+
nvidia-nccl-cu12==2.21.5
|
| 98 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 99 |
+
nvidia-nvtx-cu12==12.4.127
|
| 100 |
+
omegaconf==2.3.0
|
| 101 |
+
opencv-python==4.11.0.86
|
| 102 |
+
opencv-python-headless==4.11.0.86
|
| 103 |
+
packaging==25.0
|
| 104 |
+
pandas==2.3.3
|
| 105 |
+
parso==0.8.5
|
| 106 |
+
pexpect==4.9.0
|
| 107 |
+
pillow==12.1.0
|
| 108 |
+
pipablepytorch3d==0.7.6
|
| 109 |
+
platformdirs==4.5.1
|
| 110 |
+
pluggy==1.6.0
|
| 111 |
+
portalocker==3.2.0
|
| 112 |
+
prompt_toolkit==3.0.52
|
| 113 |
+
protobuf==6.33.2
|
| 114 |
+
psutil==7.2.1
|
| 115 |
+
ptyprocess==0.7.0
|
| 116 |
+
pure_eval==0.2.3
|
| 117 |
+
py-cpuinfo==9.0.0
|
| 118 |
+
pyarrow==14.0.1
|
| 119 |
+
pydantic==2.10.6
|
| 120 |
+
pydantic_core==2.27.2
|
| 121 |
+
Pygments==2.19.2
|
| 122 |
+
PyOpenGL==3.1.10
|
| 123 |
+
pyparsing==3.3.1
|
| 124 |
+
pyrsistent==0.20.0
|
| 125 |
+
pytest==9.0.2
|
| 126 |
+
python-dateutil==2.9.0.post0
|
| 127 |
+
pytz==2025.2
|
| 128 |
+
PyYAML==6.0.3
|
| 129 |
+
qwen-vl-utils==0.0.14
|
| 130 |
+
regex==2025.11.3
|
| 131 |
+
requests==2.32.5
|
| 132 |
+
rich==14.2.0
|
| 133 |
+
robosuite==1.4.0
|
| 134 |
+
safetensors==0.7.0
|
| 135 |
+
scikit-image==0.25.2
|
| 136 |
+
scipy==1.15.3
|
| 137 |
+
sentry-sdk==2.48.0
|
| 138 |
+
setuptools==80.9.0
|
| 139 |
+
six==1.17.0
|
| 140 |
+
smmap==5.0.2
|
| 141 |
+
stack-data==0.6.3
|
| 142 |
+
starVLA==1.0.1
|
| 143 |
+
sympy==1.13.1
|
| 144 |
+
tabulate==0.9.0
|
| 145 |
+
tensorboard==2.20.0
|
| 146 |
+
tensorboard-data-server==0.7.2
|
| 147 |
+
termcolor==3.3.0
|
| 148 |
+
tifffile==2025.5.10
|
| 149 |
+
tiktoken==0.12.0
|
| 150 |
+
timm==1.0.22
|
| 151 |
+
tokenizers==0.22.1
|
| 152 |
+
tomli==2.3.0
|
| 153 |
+
torch==2.5.1
|
| 154 |
+
torchvision==0.20.1
|
| 155 |
+
tqdm==4.67.1
|
| 156 |
+
traitlets==5.14.3
|
| 157 |
+
transformers==4.57.3
|
| 158 |
+
transformers-stream-generator==0.0.4
|
| 159 |
+
triton==3.1.0
|
| 160 |
+
typeguard==4.4.4
|
| 161 |
+
typing_extensions==4.15.0
|
| 162 |
+
tyro==1.0.3
|
| 163 |
+
tzdata==2025.3
|
| 164 |
+
urllib3==2.6.2
|
| 165 |
+
wandb==0.23.1
|
| 166 |
+
wcwidth==0.2.14
|
| 167 |
+
websocket==0.2.1
|
| 168 |
+
websocket-client==1.8.0
|
| 169 |
+
websockets==15.0.1
|
| 170 |
+
Werkzeug==3.1.4
|
| 171 |
+
yacs==0.1.8
|
| 172 |
+
zipp==3.23.0
|
| 173 |
+
zope.event==6.1
|
| 174 |
+
zope.interface==8.1.1
|
| 175 |
+
autocommand==2.2.2
|
| 176 |
+
backports.tarfile==1.2.0
|
| 177 |
+
importlib_metadata==8.0.0
|
| 178 |
+
inflect==7.3.1
|
| 179 |
+
jaraco.collections==5.1.0
|
| 180 |
+
jaraco.context==5.3.0
|
| 181 |
+
jaraco.functools==4.0.1
|
| 182 |
+
jaraco.text==3.12.1
|
| 183 |
+
more-itertools==10.3.0
|
| 184 |
+
packaging==24.2
|
| 185 |
+
platformdirs==4.2.2
|
| 186 |
+
tomli==2.0.1
|
| 187 |
+
typeguard==4.3.0
|
| 188 |
+
typing_extensions==4.12.2
|
| 189 |
+
wheel==0.45.1
|
| 190 |
+
zipp==3.19.2
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,122 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36",
|
| 3 |
+
"python": "CPython 3.10.19",
|
| 4 |
+
"startedAt": "2026-01-12T05:32:56.070975Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--config_yaml",
|
| 7 |
+
"scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml",
|
| 8 |
+
"--framework.name",
|
| 9 |
+
"QwenOFT",
|
| 10 |
+
"--framework.qwenvl.base_vlm",
|
| 11 |
+
"/home/tiger/.cache/huggingface/hub/models--Qwen--Qwen3-VL-8B-Instruct/snapshots/0c351dd01ed87e9c1b53cbc748cba10e6187ff3b",
|
| 12 |
+
"--datasets.vla_data.data_root_dir",
|
| 13 |
+
"./playground/Datasets/OXE_LEROBOT",
|
| 14 |
+
"--datasets.vla_data.data_mix",
|
| 15 |
+
"bridge_rt_1",
|
| 16 |
+
"--datasets.vla_data.per_device_batch_size",
|
| 17 |
+
"8",
|
| 18 |
+
"--trainer.freeze_modules",
|
| 19 |
+
"--trainer.max_train_steps",
|
| 20 |
+
"100000",
|
| 21 |
+
"--trainer.save_interval",
|
| 22 |
+
"10000",
|
| 23 |
+
"--trainer.logging_frequency",
|
| 24 |
+
"50",
|
| 25 |
+
"--trainer.eval_interval",
|
| 26 |
+
"200",
|
| 27 |
+
"--run_root_dir",
|
| 28 |
+
"./Checkpoints",
|
| 29 |
+
"--run_id",
|
| 30 |
+
"qwen3vl_bridge_rt1_QwenOFT_0112_1323",
|
| 31 |
+
"--output_dir",
|
| 32 |
+
"./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323",
|
| 33 |
+
"--wandb.project",
|
| 34 |
+
"Qwen3VL_Bridge_RT1_QwenOFT",
|
| 35 |
+
"--wandb.entity",
|
| 36 |
+
"lookas"
|
| 37 |
+
],
|
| 38 |
+
"program": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py",
|
| 39 |
+
"codePath": "starVLA/training/train_starvla.py",
|
| 40 |
+
"codePathLocal": "starVLA/training/train_starvla.py",
|
| 41 |
+
"git": {
|
| 42 |
+
"remote": "https://github.com/hilookas/starVLA_pickxiguapi",
|
| 43 |
+
"commit": "ab531aff5b27795879c61f67892330a616e9dbf0"
|
| 44 |
+
},
|
| 45 |
+
"email": "hilookas@gmail.com",
|
| 46 |
+
"root": "./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb",
|
| 47 |
+
"host": "g340-cd51-7700-770-343f-3fec-69bb",
|
| 48 |
+
"executable": "/mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3",
|
| 49 |
+
"cpu_count": 90,
|
| 50 |
+
"cpu_count_logical": 180,
|
| 51 |
+
"gpu": "NVIDIA H20",
|
| 52 |
+
"gpu_count": 8,
|
| 53 |
+
"disk": {
|
| 54 |
+
"/": {
|
| 55 |
+
"total": "3779301580800",
|
| 56 |
+
"used": "159098298368"
|
| 57 |
+
}
|
| 58 |
+
},
|
| 59 |
+
"memory": {
|
| 60 |
+
"total": "2071188119552"
|
| 61 |
+
},
|
| 62 |
+
"gpu_nvidia": [
|
| 63 |
+
{
|
| 64 |
+
"name": "NVIDIA H20",
|
| 65 |
+
"memoryTotal": "102625181696",
|
| 66 |
+
"cudaCores": 9984,
|
| 67 |
+
"architecture": "Hopper",
|
| 68 |
+
"uuid": "GPU-f99bae5f-ffca-4972-6420-64c42ba64f22"
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"name": "NVIDIA H20",
|
| 72 |
+
"memoryTotal": "102625181696",
|
| 73 |
+
"cudaCores": 9984,
|
| 74 |
+
"architecture": "Hopper",
|
| 75 |
+
"uuid": "GPU-a00709c9-6bdf-4011-64dc-95421da94ba4"
|
| 76 |
+
},
|
| 77 |
+
{
|
| 78 |
+
"name": "NVIDIA H20",
|
| 79 |
+
"memoryTotal": "102625181696",
|
| 80 |
+
"cudaCores": 9984,
|
| 81 |
+
"architecture": "Hopper",
|
| 82 |
+
"uuid": "GPU-726de9f6-32e7-ef4d-fc34-6c13a008a3d5"
|
| 83 |
+
},
|
| 84 |
+
{
|
| 85 |
+
"name": "NVIDIA H20",
|
| 86 |
+
"memoryTotal": "102625181696",
|
| 87 |
+
"cudaCores": 9984,
|
| 88 |
+
"architecture": "Hopper",
|
| 89 |
+
"uuid": "GPU-1d552a6f-4f40-493c-bbb6-dc23034730f9"
|
| 90 |
+
},
|
| 91 |
+
{
|
| 92 |
+
"name": "NVIDIA H20",
|
| 93 |
+
"memoryTotal": "102625181696",
|
| 94 |
+
"cudaCores": 9984,
|
| 95 |
+
"architecture": "Hopper",
|
| 96 |
+
"uuid": "GPU-6ffcbe46-9c9e-f1d6-e58a-ea13190e3218"
|
| 97 |
+
},
|
| 98 |
+
{
|
| 99 |
+
"name": "NVIDIA H20",
|
| 100 |
+
"memoryTotal": "102625181696",
|
| 101 |
+
"cudaCores": 9984,
|
| 102 |
+
"architecture": "Hopper",
|
| 103 |
+
"uuid": "GPU-90d2ce1a-4682-8d99-af06-2477b3d3bcde"
|
| 104 |
+
},
|
| 105 |
+
{
|
| 106 |
+
"name": "NVIDIA H20",
|
| 107 |
+
"memoryTotal": "102625181696",
|
| 108 |
+
"cudaCores": 9984,
|
| 109 |
+
"architecture": "Hopper",
|
| 110 |
+
"uuid": "GPU-4fa493fc-c408-182f-138e-bcc15c7f9138"
|
| 111 |
+
},
|
| 112 |
+
{
|
| 113 |
+
"name": "NVIDIA H20",
|
| 114 |
+
"memoryTotal": "102625181696",
|
| 115 |
+
"cudaCores": 9984,
|
| 116 |
+
"architecture": "Hopper",
|
| 117 |
+
"uuid": "GPU-16ef9185-6132-8620-ad2e-1f8920ded508"
|
| 118 |
+
}
|
| 119 |
+
],
|
| 120 |
+
"cudaVersion": "12.4",
|
| 121 |
+
"writerId": "3h4xzexd9mhzcjwlbp7j0zfzyqq963et"
|
| 122 |
+
}
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"epoch":0.85,"data_time":0.7947496069828048,"mse_score":0.007877199777535029,"_wandb":{"runtime":121936},"action_dit_loss":0.0705610066652298,"model_time":0.9573145949980244,"learning_rate":5e-07,"_runtime":121936.771979222,"_timestamp":1.7683178622202885e+09,"_step":100000}
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-12T13:33:02.374820947+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-12T13:33:03.82154982+08:00","level":"INFO","msg":"stream: created new stream","id":"ueywjhk5"}
|
| 3 |
+
{"time":"2026-01-12T13:33:03.821725323+08:00","level":"INFO","msg":"handler: started","stream_id":"ueywjhk5"}
|
| 4 |
+
{"time":"2026-01-12T13:33:03.846752186+08:00","level":"INFO","msg":"stream: started","id":"ueywjhk5"}
|
| 5 |
+
{"time":"2026-01-12T13:33:03.846770681+08:00","level":"INFO","msg":"writer: started","stream_id":"ueywjhk5"}
|
| 6 |
+
{"time":"2026-01-12T13:33:03.846770288+08:00","level":"INFO","msg":"sender: started","stream_id":"ueywjhk5"}
|
| 7 |
+
{"time":"2026-01-12T14:18:31.589248229+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 8 |
+
{"time":"2026-01-12T14:39:00.33374833+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 9 |
+
{"time":"2026-01-12T14:45:00.196854395+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 10 |
+
{"time":"2026-01-12T15:30:49.608798424+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": net/http: request canceled while waiting for connection (Client.Timeout exceeded while awaiting headers)"}
|
| 11 |
+
{"time":"2026-01-12T15:58:15.168936649+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 12 |
+
{"time":"2026-01-12T16:32:15.169856477+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 13 |
+
{"time":"2026-01-12T16:32:28.120660769+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 14 |
+
{"time":"2026-01-12T18:52:15.110123119+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-12T20:25:15.093766297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 16 |
+
{"time":"2026-01-12T20:46:29.622105415+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": Gateway Timeout"}
|
| 17 |
+
{"time":"2026-01-12T20:57:51.676789447+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-01-12T21:34:03.873286543+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-01-12T21:57:16.546518785+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-01-12T22:29:15.864952943+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 21 |
+
{"time":"2026-01-12T22:36:13.618868987+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 22 |
+
{"time":"2026-01-12T22:36:31.272703076+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 23 |
+
{"time":"2026-01-13T00:17:45.174009838+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 24 |
+
{"time":"2026-01-13T00:17:57.789671331+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 25 |
+
{"time":"2026-01-13T00:18:45.160525879+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 26 |
+
{"time":"2026-01-13T01:22:18.006447633+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 27 |
+
{"time":"2026-01-13T02:03:21.340298852+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 28 |
+
{"time":"2026-01-13T03:04:34.668877357+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 29 |
+
{"time":"2026-01-13T03:04:47.661210297+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 30 |
+
{"time":"2026-01-13T03:12:30.235091077+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 31 |
+
{"time":"2026-01-13T03:13:15.087092941+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 32 |
+
{"time":"2026-01-13T05:33:30.27306441+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 33 |
+
{"time":"2026-01-13T05:33:45.195585087+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 34 |
+
{"time":"2026-01-13T05:34:15.047256192+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 35 |
+
{"time":"2026-01-13T06:34:30.165692234+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 36 |
+
{"time":"2026-01-13T06:34:42.845804108+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 37 |
+
{"time":"2026-01-13T06:34:59.430634519+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 38 |
+
{"time":"2026-01-13T06:35:45.090534347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 39 |
+
{"time":"2026-01-13T06:38:45.24671956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 40 |
+
{"time":"2026-01-13T06:40:00.085760676+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 41 |
+
{"time":"2026-01-13T06:40:30.253594276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 42 |
+
{"time":"2026-01-13T06:40:45.119737819+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 43 |
+
{"time":"2026-01-13T06:41:01.006178451+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 44 |
+
{"time":"2026-01-13T09:01:01.259781836+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 45 |
+
{"time":"2026-01-13T10:20:27.160154786+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 46 |
+
{"time":"2026-01-13T11:23:00.198050425+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 47 |
+
{"time":"2026-01-13T11:24:00.137963825+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 48 |
+
{"time":"2026-01-13T11:41:16.643086394+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 49 |
+
{"time":"2026-01-13T12:21:36.803454674+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 50 |
+
{"time":"2026-01-13T12:29:23.122571501+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 51 |
+
{"time":"2026-01-13T12:59:15.208303261+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 52 |
+
{"time":"2026-01-13T13:06:15.210877761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 53 |
+
{"time":"2026-01-13T13:06:27.856833979+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 54 |
+
{"time":"2026-01-13T13:09:06.355015154+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 55 |
+
{"time":"2026-01-13T13:40:00.126142378+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 56 |
+
{"time":"2026-01-13T13:46:32.168389695+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 57 |
+
{"time":"2026-01-13T13:48:15.081349554+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 58 |
+
{"time":"2026-01-13T13:57:00.197403381+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 59 |
+
{"time":"2026-01-13T15:57:25.317460174+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 60 |
+
{"time":"2026-01-13T15:59:46.726236225+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 61 |
+
{"time":"2026-01-13T16:09:46.448847236+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 62 |
+
{"time":"2026-01-13T16:58:01.095875797+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": unexpected EOF"}
|
| 63 |
+
{"time":"2026-01-13T17:24:10.021730043+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 64 |
+
{"time":"2026-01-13T18:27:15.075407399+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 65 |
+
{"time":"2026-01-13T18:36:00.080917996+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 66 |
+
{"time":"2026-01-13T18:36:30.217018153+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 67 |
+
{"time":"2026-01-13T18:38:00.137187254+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 68 |
+
{"time":"2026-01-13T18:54:07.673379631+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 69 |
+
{"time":"2026-01-13T19:07:00.253334334+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 70 |
+
{"time":"2026-01-13T19:15:30.09514757+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream\": EOF"}
|
| 71 |
+
{"time":"2026-01-13T20:25:51.505745758+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 72 |
+
{"time":"2026-01-13T21:59:51.560168548+08:00","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/ueywjhk5/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
|
| 73 |
+
{"time":"2026-01-13T23:25:27.580587803+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 74 |
+
{"time":"2026-01-13T23:25:28.86707285+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
|
| 75 |
+
{"time":"2026-01-13T23:25:28.876898999+08:00","level":"INFO","msg":"stream: closing","id":"ueywjhk5"}
|
| 76 |
+
{"time":"2026-01-13T23:25:28.876914442+08:00","level":"INFO","msg":"handler: closed","stream_id":"ueywjhk5"}
|
| 77 |
+
{"time":"2026-01-13T23:25:28.90868024+08:00","level":"INFO","msg":"sender: closed","stream_id":"ueywjhk5"}
|
| 78 |
+
{"time":"2026-01-13T23:25:28.90870897+08:00","level":"INFO","msg":"stream: closed","id":"ueywjhk5"}
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/logs/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenOFT_0112_1323/wandb/wandb/run-20260112_133256-ueywjhk5/run-ueywjhk5.wandb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:83487df0cfa0c26289ddf787c1fe8b54cbfef38f3aa069954fbf2e6d6d683736
|
| 3 |
+
size 112544775
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/config.yaml
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
datasets:
|
| 2 |
+
vla_data:
|
| 3 |
+
CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
|
| 4 |
+
Locate their bounding boxes in [x1,y1,x2,y2] format.
|
| 5 |
+
data_mix: bridge_rt_1
|
| 6 |
+
data_root_dir: ./playground/Datasets/OXE_LEROBOT
|
| 7 |
+
dataset_py: lerobot_datasets
|
| 8 |
+
image_size:
|
| 9 |
+
- 224
|
| 10 |
+
- 224
|
| 11 |
+
per_device_batch_size: 8
|
| 12 |
+
video_backend: torchvision_av
|
| 13 |
+
framework:
|
| 14 |
+
action_model:
|
| 15 |
+
action_dim: 7
|
| 16 |
+
action_hidden_dim: 4096
|
| 17 |
+
action_model_type: DiT-B
|
| 18 |
+
future_action_window_size: 15
|
| 19 |
+
past_action_window_size: 0
|
| 20 |
+
name: QwenOFT
|
| 21 |
+
qwenvl:
|
| 22 |
+
base_vlm: /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
|
| 23 |
+
output_dir: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0117_1748
|
| 24 |
+
run_id: qwen3vl_bridge_rt1_QwenOFT_0117_1748
|
| 25 |
+
run_root_dir: ./Checkpoints
|
| 26 |
+
seed: 42
|
| 27 |
+
trainer:
|
| 28 |
+
eval_interval: 200
|
| 29 |
+
freeze_modules: true
|
| 30 |
+
gradient_accumulation_steps: 1
|
| 31 |
+
gradient_clipping: 1.0
|
| 32 |
+
is_resume: false
|
| 33 |
+
learning_rate:
|
| 34 |
+
action_model: 0.0001
|
| 35 |
+
base: 1.0e-05
|
| 36 |
+
qwen_vl_interface: 1.0e-05
|
| 37 |
+
logging_frequency: 50
|
| 38 |
+
lr_scheduler_type: cosine_with_min_lr
|
| 39 |
+
max_train_steps: 100000
|
| 40 |
+
num_warmup_steps: 10000
|
| 41 |
+
optimizer:
|
| 42 |
+
betas:
|
| 43 |
+
- 0.9
|
| 44 |
+
- 0.95
|
| 45 |
+
eps: 1.0e-08
|
| 46 |
+
weight_decay: 1.0e-08
|
| 47 |
+
save_interval: 10000
|
| 48 |
+
scheduler_specific_kwargs:
|
| 49 |
+
min_lr: 5.0e-07
|
| 50 |
+
wandb_entity: lookas
|
| 51 |
+
wandb_project: Qwen3VL_Bridge_RT1_OFT
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/dataset_statistics.json
ADDED
|
@@ -0,0 +1,264 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"oxe_bridge": {
|
| 3 |
+
"action": {
|
| 4 |
+
"mean": [
|
| 5 |
+
0.00011365935642970726,
|
| 6 |
+
6.556110747624189e-05,
|
| 7 |
+
-6.320965621853247e-05,
|
| 8 |
+
-7.205353176686913e-05,
|
| 9 |
+
-0.00019515302847139537,
|
| 10 |
+
0.0001203166029881686,
|
| 11 |
+
0.28829458355903625
|
| 12 |
+
],
|
| 13 |
+
"std": [
|
| 14 |
+
0.006909770731857718,
|
| 15 |
+
0.009684093232852218,
|
| 16 |
+
0.00896290498528129,
|
| 17 |
+
0.020121052930683073,
|
| 18 |
+
0.021582655517295487,
|
| 19 |
+
0.054723342223346974,
|
| 20 |
+
0.4543627821514982
|
| 21 |
+
],
|
| 22 |
+
"max": [
|
| 23 |
+
0.41691166162490845,
|
| 24 |
+
0.25864794850349426,
|
| 25 |
+
0.21218234300613403,
|
| 26 |
+
3.122201919555664,
|
| 27 |
+
1.8618112802505493,
|
| 28 |
+
6.272472858428955,
|
| 29 |
+
1.0
|
| 30 |
+
],
|
| 31 |
+
"min": [
|
| 32 |
+
-0.4007510244846344,
|
| 33 |
+
-0.13874775171279907,
|
| 34 |
+
-0.22553899884223938,
|
| 35 |
+
-3.2010786533355713,
|
| 36 |
+
-1.8618112802505493,
|
| 37 |
+
-6.279075622558594,
|
| 38 |
+
0.0
|
| 39 |
+
],
|
| 40 |
+
"q01": [
|
| 41 |
+
-0.02875255048274994,
|
| 42 |
+
-0.04170213546603918,
|
| 43 |
+
-0.026096721179783344,
|
| 44 |
+
-0.08052874729037285,
|
| 45 |
+
-0.09249906800687313,
|
| 46 |
+
-0.20738555490970612,
|
| 47 |
+
0.0
|
| 48 |
+
],
|
| 49 |
+
"q99": [
|
| 50 |
+
0.028306663036346436,
|
| 51 |
+
0.04089853074401617,
|
| 52 |
+
0.0401805154979229,
|
| 53 |
+
0.08173403143882751,
|
| 54 |
+
0.07760760560631752,
|
| 55 |
+
0.2038465365767479,
|
| 56 |
+
1.0
|
| 57 |
+
],
|
| 58 |
+
"mask": [
|
| 59 |
+
true,
|
| 60 |
+
true,
|
| 61 |
+
true,
|
| 62 |
+
true,
|
| 63 |
+
true,
|
| 64 |
+
true,
|
| 65 |
+
false
|
| 66 |
+
]
|
| 67 |
+
},
|
| 68 |
+
"state": {
|
| 69 |
+
"mean": [
|
| 70 |
+
0.15471743047237396,
|
| 71 |
+
0.015362550504505634,
|
| 72 |
+
0.03222028166055679,
|
| 73 |
+
0.0032453201711177826,
|
| 74 |
+
-0.038600146770477295,
|
| 75 |
+
0.05382946878671646,
|
| 76 |
+
0.0,
|
| 77 |
+
0.35406652092933655
|
| 78 |
+
],
|
| 79 |
+
"std": [
|
| 80 |
+
0.1605359274864927,
|
| 81 |
+
0.06677912092232112,
|
| 82 |
+
0.048657150951527554,
|
| 83 |
+
0.09275336958940797,
|
| 84 |
+
0.12566984746914736,
|
| 85 |
+
0.41222738578801793,
|
| 86 |
+
0.0,
|
| 87 |
+
0.4330223535305803
|
| 88 |
+
],
|
| 89 |
+
"max": [
|
| 90 |
+
0.5862360596656799,
|
| 91 |
+
0.4034728705883026,
|
| 92 |
+
0.3568263053894043,
|
| 93 |
+
1.3517684936523438,
|
| 94 |
+
1.570796251296997,
|
| 95 |
+
3.141204357147217,
|
| 96 |
+
0.0,
|
| 97 |
+
1.1121242046356201
|
| 98 |
+
],
|
| 99 |
+
"min": [
|
| 100 |
+
-0.04167502000927925,
|
| 101 |
+
-0.3563207685947418,
|
| 102 |
+
-0.15537554025650024,
|
| 103 |
+
-3.141592502593994,
|
| 104 |
+
-1.4992541074752808,
|
| 105 |
+
-3.14153790473938,
|
| 106 |
+
0.0,
|
| 107 |
+
0.04637829214334488
|
| 108 |
+
],
|
| 109 |
+
"q01": [
|
| 110 |
+
0.17102622985839844,
|
| 111 |
+
-0.1698118858039379,
|
| 112 |
+
-0.055632163770496845,
|
| 113 |
+
-0.36493172496557236,
|
| 114 |
+
-0.541871190071106,
|
| 115 |
+
-1.354275494813919,
|
| 116 |
+
0.0,
|
| 117 |
+
0.052190229296684265
|
| 118 |
+
],
|
| 119 |
+
"q99": [
|
| 120 |
+
0.45322076976299286,
|
| 121 |
+
0.2354845181107521,
|
| 122 |
+
0.19489620998501778,
|
| 123 |
+
0.3780156075954437,
|
| 124 |
+
0.27568644285202026,
|
| 125 |
+
1.8500566184520721,
|
| 126 |
+
0.0,
|
| 127 |
+
1.0105689764022827
|
| 128 |
+
]
|
| 129 |
+
},
|
| 130 |
+
"num_transitions": 1305714,
|
| 131 |
+
"num_trajectories": 53192
|
| 132 |
+
},
|
| 133 |
+
"oxe_rt1": {
|
| 134 |
+
"action": {
|
| 135 |
+
"mean": [
|
| 136 |
+
0.003493750700727105,
|
| 137 |
+
0.003132961690425873,
|
| 138 |
+
-0.0063125672750175,
|
| 139 |
+
0.02166595682501793,
|
| 140 |
+
-0.0028780836146324873,
|
| 141 |
+
0.0004565489653032273,
|
| 142 |
+
0.26771023869514465
|
| 143 |
+
],
|
| 144 |
+
"std": [
|
| 145 |
+
0.049065014465362655,
|
| 146 |
+
0.04229853739828572,
|
| 147 |
+
0.05237628880142378,
|
| 148 |
+
0.1124860236500875,
|
| 149 |
+
0.09312952783816872,
|
| 150 |
+
0.10319098309601091,
|
| 151 |
+
0.4418448662622395
|
| 152 |
+
],
|
| 153 |
+
"max": [
|
| 154 |
+
2.9984593391418457,
|
| 155 |
+
22.09052848815918,
|
| 156 |
+
2.7507524490356445,
|
| 157 |
+
1.570636510848999,
|
| 158 |
+
1.5321086645126343,
|
| 159 |
+
1.5691522359848022,
|
| 160 |
+
1.0
|
| 161 |
+
],
|
| 162 |
+
"min": [
|
| 163 |
+
-2.0204520225524902,
|
| 164 |
+
-5.497899532318115,
|
| 165 |
+
-2.031663417816162,
|
| 166 |
+
-1.569917917251587,
|
| 167 |
+
-1.569892168045044,
|
| 168 |
+
-1.570419430732727,
|
| 169 |
+
0.0
|
| 170 |
+
],
|
| 171 |
+
"q01": [
|
| 172 |
+
-0.22453527510166169,
|
| 173 |
+
-0.14820013284683228,
|
| 174 |
+
-0.231589707583189,
|
| 175 |
+
-0.3517994859814644,
|
| 176 |
+
-0.4193011274933815,
|
| 177 |
+
-0.43643461108207704,
|
| 178 |
+
0.0
|
| 179 |
+
],
|
| 180 |
+
"q99": [
|
| 181 |
+
0.17824687153100965,
|
| 182 |
+
0.14938379630446405,
|
| 183 |
+
0.21842354819178575,
|
| 184 |
+
0.5892666035890578,
|
| 185 |
+
0.35272657424211445,
|
| 186 |
+
0.44796681255102094,
|
| 187 |
+
1.0
|
| 188 |
+
],
|
| 189 |
+
"mask": [
|
| 190 |
+
true,
|
| 191 |
+
true,
|
| 192 |
+
true,
|
| 193 |
+
true,
|
| 194 |
+
true,
|
| 195 |
+
true,
|
| 196 |
+
false
|
| 197 |
+
]
|
| 198 |
+
},
|
| 199 |
+
"state": {
|
| 200 |
+
"mean": [
|
| 201 |
+
0.2799473702907562,
|
| 202 |
+
-0.04167069122195244,
|
| 203 |
+
0.38854750990867615,
|
| 204 |
+
0.21306729316711426,
|
| 205 |
+
-0.12402277439832687,
|
| 206 |
+
0.24756911396980286,
|
| 207 |
+
0.046330634504556656,
|
| 208 |
+
0.10487449914216995
|
| 209 |
+
],
|
| 210 |
+
"std": [
|
| 211 |
+
0.29342642876909925,
|
| 212 |
+
0.09174024655686211,
|
| 213 |
+
0.42569508885539115,
|
| 214 |
+
0.38616252611341306,
|
| 215 |
+
0.38314586427420927,
|
| 216 |
+
0.44433568806919804,
|
| 217 |
+
0.1263927443679382,
|
| 218 |
+
0.22122596673781084
|
| 219 |
+
],
|
| 220 |
+
"max": [
|
| 221 |
+
1.0534898042678833,
|
| 222 |
+
0.48018959164619446,
|
| 223 |
+
1.6896663904190063,
|
| 224 |
+
1.0,
|
| 225 |
+
0.9999993443489075,
|
| 226 |
+
0.9999874830245972,
|
| 227 |
+
0.9554369449615479,
|
| 228 |
+
0.9914546012878418
|
| 229 |
+
],
|
| 230 |
+
"min": [
|
| 231 |
+
-0.4436439275741577,
|
| 232 |
+
-0.9970501065254211,
|
| 233 |
+
-0.006579156965017319,
|
| 234 |
+
0.0,
|
| 235 |
+
-0.8643477559089661,
|
| 236 |
+
-0.7079970240592957,
|
| 237 |
+
-0.7688722014427185,
|
| 238 |
+
-0.4999994933605194
|
| 239 |
+
],
|
| 240 |
+
"q01": [
|
| 241 |
+
0.32481380939483645,
|
| 242 |
+
-0.28334290891885755,
|
| 243 |
+
0.14107070609927178,
|
| 244 |
+
0.0,
|
| 245 |
+
-0.686474204659462,
|
| 246 |
+
-0.6808923494815826,
|
| 247 |
+
-0.36045596331357954,
|
| 248 |
+
-0.454380963742733
|
| 249 |
+
],
|
| 250 |
+
"q99": [
|
| 251 |
+
0.8750156319141384,
|
| 252 |
+
0.21247054174542404,
|
| 253 |
+
1.0727112340927123,
|
| 254 |
+
1.0,
|
| 255 |
+
0.9377871316671368,
|
| 256 |
+
0.9563051050901409,
|
| 257 |
+
0.45990042358636823,
|
| 258 |
+
0.7216041100025177
|
| 259 |
+
]
|
| 260 |
+
},
|
| 261 |
+
"num_transitions": 3786152,
|
| 262 |
+
"num_trajectories": 87212
|
| 263 |
+
}
|
| 264 |
+
}
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/run_qwen3vl_bridge_rt1_qwen_oft.sh
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Framework_name=QwenOFT
|
| 2 |
+
dit_type="DiT-B"
|
| 3 |
+
freeze_module_list='' # fully FT, e.g., freeze_module_list=""
|
| 4 |
+
data_mix=bridge_rt_1
|
| 5 |
+
|
| 6 |
+
## Modify below paths before running ##
|
| 7 |
+
date_time=$(date +%m%d_%H%M)
|
| 8 |
+
config_yaml=scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
|
| 9 |
+
base_vlm=/home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
|
| 10 |
+
data_root_dir=./playground/Datasets/OXE_LEROBOT # local path of dataset root
|
| 11 |
+
run_root_dir=./Checkpoints
|
| 12 |
+
run_id=qwen3vl_bridge_rt1_${Framework_name}_${date_time} # run id
|
| 13 |
+
batch_size=8
|
| 14 |
+
wandb_project=Qwen3VL_Bridge_RT1_${Framework_name}
|
| 15 |
+
wandb_entity=lookas
|
| 16 |
+
|
| 17 |
+
# export WANDB_MODE=disabled
|
| 18 |
+
|
| 19 |
+
output_dir=${run_root_dir}/${run_id}
|
| 20 |
+
mkdir -p ${output_dir}
|
| 21 |
+
cp $0 ${output_dir}/
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
accelerate launch --main_process_port 12773 \
|
| 25 |
+
--config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 26 |
+
--num_processes 8 \
|
| 27 |
+
starVLA/training/train_starvla.py \
|
| 28 |
+
--config_yaml ${config_yaml} \
|
| 29 |
+
--framework.name ${Framework_name} \
|
| 30 |
+
--framework.qwenvl.base_vlm ${base_vlm} \
|
| 31 |
+
--datasets.vla_data.data_root_dir ${data_root_dir}\
|
| 32 |
+
--datasets.vla_data.data_mix ${data_mix} \
|
| 33 |
+
--datasets.vla_data.per_device_batch_size ${batch_size} \
|
| 34 |
+
--trainer.freeze_modules ${freeze_module_list} \
|
| 35 |
+
--trainer.max_train_steps 100000 \
|
| 36 |
+
--trainer.save_interval 10000 \
|
| 37 |
+
--trainer.logging_frequency 50 \
|
| 38 |
+
--trainer.eval_interval 200 \
|
| 39 |
+
--run_root_dir ${run_root_dir} \
|
| 40 |
+
--run_id ${run_id} \
|
| 41 |
+
--output_dir ${output_dir} \
|
| 42 |
+
--wandb.project ${wandb_project} \
|
| 43 |
+
--wandb.entity ${wandb_entity}
|
| 44 |
+
|
| 45 |
+
|
| 46 |
+
# multi-node launch example
|
| 47 |
+
|
| 48 |
+
# accelerate launch \
|
| 49 |
+
# --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
|
| 50 |
+
# --main_process_ip $MASTER_ADDR \
|
| 51 |
+
# --main_process_port $MASTER_PORT \
|
| 52 |
+
# --machine_rank $SLURM_PROCID \
|
| 53 |
+
# --num_machines $SLURM_NNODES \
|
| 54 |
+
# --num_processes=${TOTAL_GPUS} \
|
| 55 |
+
# starVLA/training/train_starvla.py \
|
| 56 |
+
# --config_yaml ./starVLA/config/training/starvla_cotrain_oxe.yaml \
|
| 57 |
+
# --framework.framework_py QwenGR00T \
|
| 58 |
+
# --framework.qwenvl.base_vlm microsoft/Florence-2-large \
|
| 59 |
+
# --run_root_dir ${run_root_dir} \
|
| 60 |
+
# --run_id ${run_id} \
|
| 61 |
+
# --wandb_project your_project \
|
| 62 |
+
# --wandb_entity your_name
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/summary.jsonl
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"steps": 10000}
|
| 2 |
+
{"steps": 20000}
|
| 3 |
+
{"steps": 30000}
|
| 4 |
+
{"steps": 40000}
|
| 5 |
+
{"steps": 50000}
|
| 6 |
+
{"steps": 60000}
|
| 7 |
+
{"steps": 70000}
|
| 8 |
+
{"steps": 80000}
|
| 9 |
+
{"steps": 90000}
|
| 10 |
+
{"steps": 100000}
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug-internal.log
ADDED
|
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-01-17T18:05:32.919256759+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.1"}
|
| 2 |
+
{"time":"2026-01-17T18:05:36.622867047+08:00","level":"INFO","msg":"stream: created new stream","id":"rqrn3qyr"}
|
| 3 |
+
{"time":"2026-01-17T18:05:36.623047484+08:00","level":"INFO","msg":"handler: started","stream_id":"rqrn3qyr"}
|
| 4 |
+
{"time":"2026-01-17T18:05:36.648380876+08:00","level":"INFO","msg":"stream: started","id":"rqrn3qyr"}
|
| 5 |
+
{"time":"2026-01-17T18:05:36.64839606+08:00","level":"INFO","msg":"writer: started","stream_id":"rqrn3qyr"}
|
| 6 |
+
{"time":"2026-01-17T18:05:36.648398878+08:00","level":"INFO","msg":"sender: started","stream_id":"rqrn3qyr"}
|
| 7 |
+
{"time":"2026-01-17T22:37:34.86356798+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:52928->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
|
| 8 |
+
{"time":"2026-01-17T22:54:18.423710102+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 9 |
+
{"time":"2026-01-18T00:12:50.883820737+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 10 |
+
{"time":"2026-01-18T02:09:32.843274738+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:52904->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
|
| 11 |
+
{"time":"2026-01-18T13:00:31.504000712+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:43174->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
|
| 12 |
+
{"time":"2026-01-18T15:24:38.642505893+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 13 |
+
{"time":"2026-01-18T19:01:56.523537868+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 14 |
+
{"time":"2026-01-18T20:33:30.03545379+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-01-18T20:34:13.086658278+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 16 |
+
{"time":"2026-01-18T21:46:54.335541764+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": read tcp [2605:340:cd51:7700:4fb:cd4a:6d4e:969e]:53174->[64:ff9b::23ba:e431]:443: read: connection reset by peer"}
|
| 17 |
+
{"time":"2026-01-18T21:47:09.229423294+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-01-18T23:52:58.941500301+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-01-19T02:13:36.852336596+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/lookas/Qwen3VL_Bridge_RT1_OFT/rqrn3qyr/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-01-19T02:28:43.986696739+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 21 |
+
{"time":"2026-01-19T02:28:45.179352006+08:00","level":"INFO","msg":"handler: operation stats","stats":{}}
|
| 22 |
+
{"time":"2026-01-19T02:28:45.189009251+08:00","level":"INFO","msg":"stream: closing","id":"rqrn3qyr"}
|
| 23 |
+
{"time":"2026-01-19T02:28:45.189020364+08:00","level":"INFO","msg":"handler: closed","stream_id":"rqrn3qyr"}
|
| 24 |
+
{"time":"2026-01-19T02:28:45.20863216+08:00","level":"INFO","msg":"sender: closed","stream_id":"rqrn3qyr"}
|
| 25 |
+
{"time":"2026-01-19T02:28:45.208650774+08:00","level":"INFO","msg":"stream: closed","id":"rqrn3qyr"}
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/debug.log
ADDED
|
File without changes
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/config.yaml
ADDED
|
@@ -0,0 +1,133 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_wandb:
|
| 2 |
+
value:
|
| 3 |
+
cli_version: 0.23.1
|
| 4 |
+
e:
|
| 5 |
+
5cfcqp03otctf4fyn22usch179j8xvxz:
|
| 6 |
+
args:
|
| 7 |
+
- --config_yaml
|
| 8 |
+
- scripts/ER1_5/qwen3vl_bridge_rt1_oft.yaml
|
| 9 |
+
- --framework.name
|
| 10 |
+
- QwenOFT
|
| 11 |
+
- --framework.qwenvl.base_vlm
|
| 12 |
+
- /home/tiger/.cache/huggingface/hub/models--Embodied1--Embodied-R1.5-SFT-v1/snapshots/0d2820fe1b7f598d2765b234ea69c351211b55c9
|
| 13 |
+
- --datasets.vla_data.data_root_dir
|
| 14 |
+
- ./playground/Datasets/OXE_LEROBOT
|
| 15 |
+
- --datasets.vla_data.data_mix
|
| 16 |
+
- bridge_rt_1
|
| 17 |
+
- --datasets.vla_data.per_device_batch_size
|
| 18 |
+
- "8"
|
| 19 |
+
- --trainer.freeze_modules
|
| 20 |
+
- --trainer.max_train_steps
|
| 21 |
+
- "100000"
|
| 22 |
+
- --trainer.save_interval
|
| 23 |
+
- "10000"
|
| 24 |
+
- --trainer.logging_frequency
|
| 25 |
+
- "50"
|
| 26 |
+
- --trainer.eval_interval
|
| 27 |
+
- "200"
|
| 28 |
+
- --run_root_dir
|
| 29 |
+
- ./Checkpoints
|
| 30 |
+
- --run_id
|
| 31 |
+
- qwen3vl_bridge_rt1_QwenOFT_0117_1748
|
| 32 |
+
- --output_dir
|
| 33 |
+
- ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0117_1748
|
| 34 |
+
- --wandb.project
|
| 35 |
+
- Qwen3VL_Bridge_RT1_QwenOFT
|
| 36 |
+
- --wandb.entity
|
| 37 |
+
- lookas
|
| 38 |
+
codePath: starVLA/training/train_starvla.py
|
| 39 |
+
codePathLocal: starVLA/training/train_starvla.py
|
| 40 |
+
cpu_count: 90
|
| 41 |
+
cpu_count_logical: 180
|
| 42 |
+
cudaVersion: "12.4"
|
| 43 |
+
disk:
|
| 44 |
+
/:
|
| 45 |
+
total: "3779301580800"
|
| 46 |
+
used: "151636508672"
|
| 47 |
+
email: hilookas@gmail.com
|
| 48 |
+
executable: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/.venv/bin/python3
|
| 49 |
+
git:
|
| 50 |
+
commit: ab531aff5b27795879c61f67892330a616e9dbf0
|
| 51 |
+
remote: https://github.com/hilookas/starVLA_pickxiguapi
|
| 52 |
+
gpu: NVIDIA H20
|
| 53 |
+
gpu_count: 8
|
| 54 |
+
gpu_nvidia:
|
| 55 |
+
- architecture: Hopper
|
| 56 |
+
cudaCores: 9984
|
| 57 |
+
memoryTotal: "102625181696"
|
| 58 |
+
name: NVIDIA H20
|
| 59 |
+
uuid: GPU-fb4370de-60ba-70ca-eeca-022c40ee5dc2
|
| 60 |
+
- architecture: Hopper
|
| 61 |
+
cudaCores: 9984
|
| 62 |
+
memoryTotal: "102625181696"
|
| 63 |
+
name: NVIDIA H20
|
| 64 |
+
uuid: GPU-2b87ce45-0783-3787-00a5-678fab82dff7
|
| 65 |
+
- architecture: Hopper
|
| 66 |
+
cudaCores: 9984
|
| 67 |
+
memoryTotal: "102625181696"
|
| 68 |
+
name: NVIDIA H20
|
| 69 |
+
uuid: GPU-f37740ca-0c96-508b-6014-0c7c5717ce90
|
| 70 |
+
- architecture: Hopper
|
| 71 |
+
cudaCores: 9984
|
| 72 |
+
memoryTotal: "102625181696"
|
| 73 |
+
name: NVIDIA H20
|
| 74 |
+
uuid: GPU-f59773d6-f9c1-34dc-06fa-92979c9f3c64
|
| 75 |
+
- architecture: Hopper
|
| 76 |
+
cudaCores: 9984
|
| 77 |
+
memoryTotal: "102625181696"
|
| 78 |
+
name: NVIDIA H20
|
| 79 |
+
uuid: GPU-993ec1cf-6953-aff2-fd04-2f116a004be8
|
| 80 |
+
- architecture: Hopper
|
| 81 |
+
cudaCores: 9984
|
| 82 |
+
memoryTotal: "102625181696"
|
| 83 |
+
name: NVIDIA H20
|
| 84 |
+
uuid: GPU-c1ddbd85-e0d5-97e8-cc7e-3bb01759b504
|
| 85 |
+
- architecture: Hopper
|
| 86 |
+
cudaCores: 9984
|
| 87 |
+
memoryTotal: "102625181696"
|
| 88 |
+
name: NVIDIA H20
|
| 89 |
+
uuid: GPU-e8bab208-8550-dbd6-9630-08f32d2f4fce
|
| 90 |
+
- architecture: Hopper
|
| 91 |
+
cudaCores: 9984
|
| 92 |
+
memoryTotal: "102625181696"
|
| 93 |
+
name: NVIDIA H20
|
| 94 |
+
uuid: GPU-8be9c3c0-cd15-3534-0dbd-de2c1d6aaf1d
|
| 95 |
+
host: g340-cd51-7700-4fb-cd4a-6d4e-969e
|
| 96 |
+
memory:
|
| 97 |
+
total: "2071188119552"
|
| 98 |
+
os: Linux-5.15.152.bsk.10-amd64-x86_64-with-glibc2.36
|
| 99 |
+
program: /mnt/bn/ic-vlm/personal/cuihaiqin/pickxiguapi/starVLA/starVLA/training/train_starvla.py
|
| 100 |
+
python: CPython 3.10.19
|
| 101 |
+
root: ./Checkpoints/qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb
|
| 102 |
+
startedAt: "2026-01-17T10:05:26.699051Z"
|
| 103 |
+
writerId: 5cfcqp03otctf4fyn22usch179j8xvxz
|
| 104 |
+
m: []
|
| 105 |
+
python_version: 3.10.19
|
| 106 |
+
t:
|
| 107 |
+
"1":
|
| 108 |
+
- 1
|
| 109 |
+
- 11
|
| 110 |
+
- 41
|
| 111 |
+
- 49
|
| 112 |
+
- 63
|
| 113 |
+
- 71
|
| 114 |
+
- 80
|
| 115 |
+
- 83
|
| 116 |
+
"2":
|
| 117 |
+
- 1
|
| 118 |
+
- 11
|
| 119 |
+
- 41
|
| 120 |
+
- 49
|
| 121 |
+
- 63
|
| 122 |
+
- 71
|
| 123 |
+
- 80
|
| 124 |
+
- 83
|
| 125 |
+
"3":
|
| 126 |
+
- 2
|
| 127 |
+
- 13
|
| 128 |
+
- 61
|
| 129 |
+
"4": 3.10.19
|
| 130 |
+
"5": 0.23.1
|
| 131 |
+
"6": 4.57.3
|
| 132 |
+
"12": 0.23.1
|
| 133 |
+
"13": linux-x86_64
|
qwen3vl_bridge_rt1_QwenOFT_0117_1748/wandb/wandb/run-20260117_180526-rqrn3qyr/files/output.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|