Vincent2311 committed on
Commit
41edbd7
·
verified ·
1 Parent(s): 01d79f8

Add files using upload-large-folder tool

Browse files
Files changed (17) hide show
  1. .gitattributes +1 -0
  2. franka_move_egg_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_095749-90ibcpp4/logs/debug-core.log +12 -0
  3. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/checkpoints/steps_4000_pytorch_model.pt +3 -0
  4. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/checkpoints/steps_8000_pytorch_model.pt +3 -0
  5. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/config.yaml +70 -0
  6. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/dataset_statistics.json +193 -0
  7. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/run_franka_vp_sweep_floor.sh +64 -0
  8. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/summary.jsonl +5 -0
  9. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/debug-internal.log +7 -0
  10. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/debug.log +0 -0
  11. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/files/output.log +0 -0
  12. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/files/requirements.txt +151 -0
  13. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/files/wandb-metadata.json +145 -0
  14. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/logs/debug-core.log +7 -0
  15. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/logs/debug-internal.log +7 -0
  16. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/logs/debug.log +0 -0
  17. franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/run-tqe5jdia.wandb +3 -0
.gitattributes CHANGED
@@ -36,3 +36,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
36
  franka_move_egg_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_095749-90ibcpp4/run-90ibcpp4.wandb filter=lfs diff=lfs merge=lfs -text
37
  franka_pick_color_egg_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_100004-d1v6qg5k/run-d1v6qg5k.wandb filter=lfs diff=lfs merge=lfs -text
38
  franka_filter_class_12_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_095755-tbifv35r/run-tbifv35r.wandb filter=lfs diff=lfs merge=lfs -text
 
 
36
  franka_move_egg_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_095749-90ibcpp4/run-90ibcpp4.wandb filter=lfs diff=lfs merge=lfs -text
37
  franka_pick_color_egg_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_100004-d1v6qg5k/run-d1v6qg5k.wandb filter=lfs diff=lfs merge=lfs -text
38
  franka_filter_class_12_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_095755-tbifv35r/run-tbifv35r.wandb filter=lfs diff=lfs merge=lfs -text
39
+ franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/run-tqe5jdia.wandb filter=lfs diff=lfs merge=lfs -text
franka_move_egg_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_095749-90ibcpp4/logs/debug-core.log ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-02-24T09:57:51.577330709Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpk8ekvuek/port-2123377.txt","pid":2123377,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2026-02-24T09:57:51.57779785Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2123377}
3
+ {"time":"2026-02-24T09:57:51.577811146Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2123377-2125080-277520121/socket","Net":"unix"}}
4
+ {"time":"2026-02-24T09:57:51.746355666Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2026-02-24T09:57:51.785451649Z","level":"INFO","msg":"handleInformInit: received","streamId":"90ibcpp4","id":"1(@)"}
6
+ {"time":"2026-02-24T09:57:52.526160263Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"90ibcpp4","id":"1(@)"}
7
+ {"time":"2026-02-24T16:37:49.71580804Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2026-02-24T16:37:49.715892812Z","level":"INFO","msg":"server is shutting down"}
9
+ {"time":"2026-02-24T16:37:49.715882133Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
+ {"time":"2026-02-24T16:37:49.715968099Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2123377-2125080-277520121/socket","Net":"unix"}}
11
+ {"time":"2026-02-24T16:37:49.716029087Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
12
+ {"time":"2026-02-24T16:37:52.398753968Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/checkpoints/steps_4000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c738eb67c6a2986b64f280a4c8aefd4ceecce7e9c3601c2efff22045e62e2d18
3
+ size 9785060316
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/checkpoints/steps_8000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42c8e0dbeb330b7b709bc0e358cb3e3e38045d1d114da794dffef98475e911d3
3
+ size 9785060316
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/config.yaml ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ datasets:
2
+ vla_data:
3
+ CoT_prompt: Your task is {instruction}. To identify the key objects for your task.
4
+ Locate their bounding boxes in [x1,y1,x2,y2] format.
5
+ data_mix: smartmore_franka_sweep_floor
6
+ data_root_dir: /gpfs/wangzixuan/visual_prompting/real_data/lerobot
7
+ dataset_py: visual_prompt_datasets
8
+ delete_pause_frame: false
9
+ feed_both_images: true
10
+ image_size:
11
+ - 224
12
+ - 224
13
+ num_workers: 4
14
+ per_device_batch_size: 32
15
+ target_location_prompt_type: box
16
+ target_object_prompt_type: crosshair
17
+ use_subtask: false
18
+ video_backend: pyav
19
+ visual_prompt_dir: /gpfs/wangzixuan/visual_prompting/starVLA_robocasa/realdata_process/visual_prompts_output
20
+ vp_data:
21
+ dataset_py: visual_prompt_prediction_datasets
22
+ extracted_frames_dir: /gpfs/wangzixuan/visual_prompting/real_data/extracted_frames
23
+ feed_both_images: false
24
+ num_workers: 4
25
+ per_device_batch_size: 8
26
+ target_location_prompt_type: box
27
+ target_object_prompt_type: crosshair
28
+ visual_prompt_dir: /gpfs/wangzixuan/visual_prompting/starVLA_robocasa/realdata_process/visual_prompts_output
29
+ framework:
30
+ action_model:
31
+ action_dim: 7
32
+ action_hidden_dim: 2560
33
+ action_model_type: DiT-B
34
+ future_action_window_size: 15
35
+ past_action_window_size: 0
36
+ name: QwenOFT
37
+ qwenvl:
38
+ base_vlm: /gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Pretrained_models/Qwen3-VL-4B-Instruct
39
+ output_dir: /gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Checkpoints/franka_sweep_floor_visual_prompt_QwenOFT_4k_save
40
+ run_id: franka_sweep_floor_visual_prompt_QwenOFT_4k_save
41
+ run_root_dir: /gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Checkpoints
42
+ seed: 42
43
+ trainer:
44
+ eval_interval: 100
45
+ freeze_modules: null
46
+ gradient_accumulation_steps: 1
47
+ gradient_clipping: 1.0
48
+ is_resume: false
49
+ learning_rate:
50
+ action_model: 0.0001
51
+ base: 3.0e-05
52
+ qwen_vl_interface: 1.0e-05
53
+ logging_frequency: 10
54
+ loss_scale:
55
+ visual_prompt: 0.1
56
+ vla: 1.0
57
+ lr_scheduler_type: cosine_with_min_lr
58
+ max_train_steps: 100000
59
+ num_warmup_steps: 5000
60
+ optimizer:
61
+ betas:
62
+ - 0.9
63
+ - 0.95
64
+ eps: 1.0e-08
65
+ weight_decay: 1.0e-08
66
+ save_interval: 4000
67
+ scheduler_specific_kwargs:
68
+ min_lr: 5.0e-07
69
+ wandb_entity: zwanggk
70
+ wandb_project: franka_visual_prompt
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/dataset_statistics.json ADDED
@@ -0,0 +1,193 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "franka": {
3
+ "action": {
4
+ "mean": [
5
+ -0.08061821013689041,
6
+ 0.03849069029092789,
7
+ -0.0030605667270720005,
8
+ 0.009368009865283966,
9
+ 0.1017644926905632,
10
+ -0.056130748242139816,
11
+ -0.7683464288711548
12
+ ],
13
+ "std": [
14
+ 0.2117806375026703,
15
+ 0.2864035665988922,
16
+ 0.13817094266414642,
17
+ 0.10838928073644638,
18
+ 0.16133905947208405,
19
+ 0.1992710679769516,
20
+ 0.6400538682937622
21
+ ],
22
+ "max": [
23
+ 0.5275262594223022,
24
+ 0.7144172787666321,
25
+ 0.5165083408355713,
26
+ 0.4824982285499573,
27
+ 0.9452001452445984,
28
+ 0.7411012053489685,
29
+ 1.0
30
+ ],
31
+ "min": [
32
+ -0.9114958643913269,
33
+ -0.6978311538696289,
34
+ -0.5033432245254517,
35
+ -0.5841054916381836,
36
+ -0.34298428893089294,
37
+ -0.8224282264709473,
38
+ -1.0
39
+ ],
40
+ "q01": [
41
+ -0.6588279324769973,
42
+ -0.5336342138051987,
43
+ -0.36370937585830687,
44
+ -0.2552451795339584,
45
+ -0.1805216257274151,
46
+ -0.5486886489391327,
47
+ -1.0
48
+ ],
49
+ "q99": [
50
+ 0.36296284645795784,
51
+ 0.5701563268899916,
52
+ 0.3194278168678283,
53
+ 0.29448106050491324,
54
+ 0.6076501923799508,
55
+ 0.5486402970552432,
56
+ 1.0
57
+ ],
58
+ "mask": [
59
+ true,
60
+ true,
61
+ true,
62
+ true,
63
+ true,
64
+ true,
65
+ false
66
+ ]
67
+ },
68
+ "state": {
69
+ "mean": [
70
+ 0.22929246723651886,
71
+ -0.5722187757492065,
72
+ 1.0862715244293213,
73
+ 0.31304726004600525,
74
+ -0.1627047061920166,
75
+ 0.08631913363933563,
76
+ 0.009877122938632965,
77
+ -0.01609046943485737,
78
+ 0.033343397080898285,
79
+ -0.10010933130979538,
80
+ 0.4062647223472595,
81
+ 0.4920309782028198,
82
+ -0.2398146241903305,
83
+ -0.013218171894550323,
84
+ 0.005303372163325548,
85
+ -0.0011343698715791106,
86
+ -0.00033812131732702255,
87
+ -0.0013084859820082784
88
+ ],
89
+ "std": [
90
+ 0.28804537653923035,
91
+ 1.4905784130096436,
92
+ 2.7105965614318848,
93
+ 3.2822203636169434,
94
+ 0.06618736684322357,
95
+ 0.056241098791360855,
96
+ 0.017126617953181267,
97
+ 0.05620327964425087,
98
+ 0.04887595400214195,
99
+ 0.1578141152858734,
100
+ 0.6731232404708862,
101
+ 0.8422963619232178,
102
+ 0.42211294174194336,
103
+ 0.036596521735191345,
104
+ 0.045121997594833374,
105
+ 0.02080458588898182,
106
+ 0.05005611479282379,
107
+ 0.028937384486198425
108
+ ],
109
+ "max": [
110
+ 1.0,
111
+ 4.891953945159912,
112
+ 8.139209747314453,
113
+ 18.370073318481445,
114
+ 0.05588706210255623,
115
+ 0.19642794132232666,
116
+ 0.053001727908849716,
117
+ 0.14991311728954315,
118
+ 0.1340937465429306,
119
+ 0.4335828721523285,
120
+ 3.3109123706817627,
121
+ 3.689563751220703,
122
+ 0.9833556413650513,
123
+ 0.10158777236938477,
124
+ 0.11944770067930222,
125
+ 0.08162833005189896,
126
+ 0.16560785472393036,
127
+ 0.15716767311096191
128
+ ],
129
+ "min": [
130
+ 0.11884058266878128,
131
+ -4.3707990646362305,
132
+ -6.562924385070801,
133
+ -5.218995571136475,
134
+ -0.29098546504974365,
135
+ -0.024652721360325813,
136
+ -0.0493561252951622,
137
+ -0.14546364545822144,
138
+ -0.11700249463319778,
139
+ -0.6988881826400757,
140
+ -1.7946170568466187,
141
+ -2.162982225418091,
142
+ -0.8562780022621155,
143
+ -0.16190604865550995,
144
+ -0.12078742682933807,
145
+ -0.09719698131084442,
146
+ -0.20046618580818176,
147
+ -0.1426655799150467
148
+ ],
149
+ "q01": [
150
+ 0.11980676651000977,
151
+ -3.0677114605903624,
152
+ -3.420012638568878,
153
+ -3.6503843212127687,
154
+ -0.26542589694261554,
155
+ -0.009954770766198636,
156
+ -0.03184773214161396,
157
+ -0.12729241982102393,
158
+ -0.09293058753013611,
159
+ -0.5558860898017883,
160
+ -1.0219422972202301,
161
+ -1.4959156274795533,
162
+ -0.7284153574705123,
163
+ -0.11884139612317085,
164
+ -0.09057404629886151,
165
+ -0.06277803622186184,
166
+ -0.1031051080673933,
167
+ -0.06691223375499249
168
+ ],
169
+ "q99": [
170
+ 1.0,
171
+ 2.857337474822997,
172
+ 6.436479039192197,
173
+ 10.735821895599347,
174
+ 0.0116989194042979,
175
+ 0.1804287213087081,
176
+ 0.045605253279209126,
177
+ 0.10734622143208977,
178
+ 0.117441693469882,
179
+ 0.1687981204688547,
180
+ 2.173126604557031,
181
+ 2.767596554756164,
182
+ 0.6548447203636169,
183
+ 0.06324124120175834,
184
+ 0.09241089537739751,
185
+ 0.05182413879781959,
186
+ 0.1108243534713983,
187
+ 0.08060484960675215
188
+ ]
189
+ },
190
+ "num_transitions": 10438,
191
+ "num_trajectories": 70
192
+ }
193
+ }
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/run_franka_vp_sweep_floor.sh ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ # Visual Prompt Training Script for Franka - sweep_floor
3
+
4
+ export NCCL_SOCKET_IFNAME=bond0
5
+ export NCCL_IB_HCA=mlx5_2,mlx5_3
6
+
7
+ export NCCL_BLOCKING_WAIT=1
8
+ export NCCL_ASYNC_ERROR_HANDLING=1
9
+ export TORCH_NCCL_BLOCKING_WAIT=1
10
+ export TORCH_NCCL_ASYNC_ERROR_HANDLING=1
11
+
12
+ export NCCL_TIMEOUT=3600
13
+ export TORCH_DISTRIBUTED_DEBUG=DETAIL
14
+
15
+ Framework_name=QwenOFT
16
+ base_vlm=/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Pretrained_models/Qwen3-VL-4B-Instruct
17
+ freeze_module_list=''
18
+ DIT_TYPE="DiT-B"
19
+
20
+ # Data paths
21
+ data_root_dir=/gpfs/wangzixuan/visual_prompting/real_data/lerobot
22
+ visual_prompt_dir=/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/realdata_process/visual_prompts_output
23
+ extracted_frames_dir=/gpfs/wangzixuan/visual_prompting/real_data/extracted_frames
24
+ data_mix=smartmore_franka_sweep_floor
25
+
26
+ # Output
27
+ run_root_dir=/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Checkpoints
28
+ run_id=franka_sweep_floor_visual_prompt_QwenOFT_4k_save
29
+
30
+ output_dir=${run_root_dir}/${run_id}
31
+ mkdir -p ${output_dir}
32
+ cp $0 ${output_dir}/
33
+
34
+ accelerate launch \
35
+ --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
36
+ --num_processes 8 \
37
+ starVLA/training/train_starvla_visual_prompt.py \
38
+ --config_yaml ./examples/Franka/train_files/starvla_cotrain_franka_visual_prompt.yaml \
39
+ --framework.name ${Framework_name} \
40
+ --framework.qwenvl.base_vlm ${base_vlm} \
41
+ --framework.action_model.action_model_type ${DIT_TYPE} \
42
+ --datasets.vla_data.data_root_dir ${data_root_dir} \
43
+ --datasets.vla_data.visual_prompt_dir ${visual_prompt_dir} \
44
+ --datasets.vla_data.data_mix ${data_mix} \
45
+ --datasets.vla_data.per_device_batch_size 32 \
46
+ --datasets.vla_data.video_backend pyav \
47
+ --datasets.vp_data.visual_prompt_dir ${visual_prompt_dir} \
48
+ --datasets.vp_data.extracted_frames_dir ${extracted_frames_dir} \
49
+ --datasets.vp_data.per_device_batch_size 8 \
50
+ --trainer.freeze_modules "${freeze_module_list}" \
51
+ --trainer.max_train_steps 100000 \
52
+ --trainer.save_interval 4000 \
53
+ --trainer.logging_frequency 10 \
54
+ --trainer.eval_interval 100 \
55
+ --trainer.learning_rate.base 3e-5 \
56
+ --trainer.learning_rate.qwen_vl_interface 1e-5 \
57
+ --trainer.loss_scale.visual_prompt 0.1 \
58
+ --datasets.vla_data.use_subtask false \
59
+ --datasets.vla_data.feed_both_images true \
60
+ --datasets.vp_data.feed_both_images false \
61
+ --run_root_dir ${run_root_dir} \
62
+ --run_id ${run_id} \
63
+ --wandb_project franka_visual_prompt \
64
+ --wandb_entity zwanggk
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/summary.jsonl ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {"steps": 4000}
2
+ {"steps": 8000}
3
+ {"steps": 12000}
4
+ {"steps": 16000}
5
+ {"steps": 20000}
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2026-02-24T16:40:45.965620169Z","level":"INFO","msg":"stream: starting","core version":"0.24.0"}
2
+ {"time":"2026-02-24T16:40:46.669645148Z","level":"INFO","msg":"stream: created new stream","id":"tqe5jdia"}
3
+ {"time":"2026-02-24T16:40:46.669716806Z","level":"INFO","msg":"handler: started","stream_id":"tqe5jdia"}
4
+ {"time":"2026-02-24T16:40:46.67387105Z","level":"INFO","msg":"stream: started","id":"tqe5jdia"}
5
+ {"time":"2026-02-24T16:40:46.673890028Z","level":"INFO","msg":"writer: started","stream_id":"tqe5jdia"}
6
+ {"time":"2026-02-24T16:40:46.673898689Z","level":"INFO","msg":"sender: started","stream_id":"tqe5jdia"}
7
+ {"time":"2026-02-24T20:02:32.700623026Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/zwanggk/franka_visual_prompt/tqe5jdia/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/debug.log ADDED
File without changes
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/files/requirements.txt ADDED
@@ -0,0 +1,151 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ starVLA==1.0.1
2
+ docstring_parser==0.17.0
3
+ pydantic_core==2.27.2
4
+ py-cpuinfo==9.0.0
5
+ Werkzeug==3.1.5
6
+ pandas==2.3.3
7
+ kiwisolver==1.4.9
8
+ httpcore==1.0.9
9
+ nvidia-cuda-runtime-cu12==12.4.127
10
+ Jinja2==3.1.6
11
+ exceptiongroup==1.3.1
12
+ filelock==3.20.3
13
+ torchvision==0.21.0
14
+ gitdb==4.0.12
15
+ fastparquet==2024.11.0
16
+ tensorboard==2.20.0
17
+ portalocker==3.2.0
18
+ timm==1.0.24
19
+ nvidia-nvjitlink-cu12==12.4.127
20
+ nvidia-cudnn-cu12==9.1.0.70
21
+ pyparsing==3.3.2
22
+ protobuf==6.33.4
23
+ nvitop==1.6.2
24
+ importlib_metadata==8.7.1
25
+ GitPython==3.1.46
26
+ annotated-types==0.7.0
27
+ antlr4-python3-runtime==4.9.3
28
+ yacs==0.1.8
29
+ contourpy==1.3.2
30
+ charset-normalizer==3.4.4
31
+ hjson==3.1.0
32
+ tensorboard-data-server==0.7.2
33
+ six==1.17.0
34
+ nvidia-cuda-cupti-cu12==12.4.127
35
+ tqdm==4.67.1
36
+ h11==0.16.0
37
+ zipp==3.23.0
38
+ pipablepytorch3d==0.7.6
39
+ transformers==4.57.0
40
+ websockets==16.0
41
+ opencv-python-headless==4.11.0.86
42
+ ninja==1.13.0
43
+ websocket-client==1.8.0
44
+ nvidia-nvtx-cu12==12.4.127
45
+ grpcio==1.76.0
46
+ psutil==7.2.1
47
+ typing_extensions==4.15.0
48
+ zope.event==6.1
49
+ mdurl==0.1.2
50
+ scipy==1.15.3
51
+ pydantic==2.10.6
52
+ tiktoken==0.12.0
53
+ networkx==3.4.2
54
+ zope.interface==8.2
55
+ lazy_loader==0.4
56
+ websocket==0.2.1
57
+ huggingface-hub==0.36.0
58
+ transformers-stream-generator==0.0.4
59
+ cycler==0.12.1
60
+ safetensors==0.7.0
61
+ requests==2.32.5
62
+ matplotlib==3.10.8
63
+ nvidia-cuda-nvrtc-cu12==12.4.127
64
+ qwen-vl-utils==0.0.14
65
+ scikit-image==0.25.2
66
+ deepspeed==0.16.9
67
+ omegaconf==2.3.0
68
+ Markdown==3.10.1
69
+ sentry-sdk==2.50.0
70
+ pip==25.3
71
+ pillow==12.1.0
72
+ pyarrow==14.0.1
73
+ nvidia-cublas-cu12==12.4.5.8
74
+ termcolor==3.3.0
75
+ tifffile==2025.5.10
76
+ nvidia-curand-cu12==10.3.5.147
77
+ iopath==0.1.10
78
+ wandb==0.24.0
79
+ PyYAML==6.0.3
80
+ flash_attn==2.7.4.post1
81
+ wheel==0.45.1
82
+ tokenizers==0.22.2
83
+ idna==3.11
84
+ accelerate==1.5.2
85
+ mpmath==1.3.0
86
+ einops==0.8.1
87
+ urllib3==2.6.3
88
+ diffusers==0.36.0
89
+ hf-xet==1.2.0
90
+ eval_type_backport==0.3.1
91
+ fsspec==2026.1.0
92
+ ImageIO==2.37.2
93
+ tzdata==2025.3
94
+ torch==2.6.0
95
+ click==8.3.1
96
+ albumentations==1.4.18
97
+ setuptools==80.9.0
98
+ tabulate==0.9.0
99
+ av==12.3.0
100
+ nvidia-cusparselt-cu12==0.6.2
101
+ markdown-it-py==4.0.0
102
+ absl-py==2.3.1
103
+ nvidia-cusparse-cu12==12.3.1.170
104
+ starVLA==1.0.1
105
+ packaging==26.0
106
+ MarkupSafe==3.0.3
107
+ eva-decord==0.6.1
108
+ Pygments==2.19.2
109
+ rich==14.2.0
110
+ nvidia-cufft-cu12==11.2.1.3
111
+ numpydantic==1.6.9
112
+ triton==3.2.0
113
+ certifi==2026.1.4
114
+ smmap==5.0.2
115
+ fvcore==0.1.5.post20221221
116
+ albucore==0.0.17
117
+ fonttools==4.61.1
118
+ regex==2026.1.15
119
+ pytz==2025.2
120
+ python-dateutil==2.9.0.post0
121
+ greenlet==3.3.0
122
+ platformdirs==4.5.1
123
+ nvidia-ml-py==13.590.48
124
+ cramjam==2.11.0
125
+ numpy==1.26.4
126
+ tyro==1.0.5
127
+ nvidia-cusolver-cu12==11.6.1.9
128
+ nvidia-nccl-cu12==2.21.5
129
+ httpx==0.28.1
130
+ gevent==25.9.1
131
+ typeguard==4.4.4
132
+ msgpack==1.1.2
133
+ decord==0.6.0
134
+ sympy==1.13.1
135
+ anyio==4.12.1
136
+ jaraco.collections==5.1.0
137
+ packaging==24.2
138
+ importlib_metadata==8.0.0
139
+ tomli==2.0.1
140
+ backports.tarfile==1.2.0
141
+ typing_extensions==4.12.2
142
+ jaraco.context==5.3.0
143
+ typeguard==4.3.0
144
+ autocommand==2.2.2
145
+ jaraco.text==3.12.1
146
+ more-itertools==10.3.0
147
+ platformdirs==4.2.2
148
+ wheel==0.45.1
149
+ inflect==7.3.1
150
+ jaraco.functools==4.0.1
151
+ zipp==3.19.2
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/files/wandb-metadata.json ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-113-generic-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.10.19",
4
+ "startedAt": "2026-02-24T16:40:44.721608Z",
5
+ "args": [
6
+ "--config_yaml",
7
+ "./examples/Franka/train_files/starvla_cotrain_franka_visual_prompt.yaml",
8
+ "--framework.name",
9
+ "QwenOFT",
10
+ "--framework.qwenvl.base_vlm",
11
+ "/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Pretrained_models/Qwen3-VL-4B-Instruct",
12
+ "--framework.action_model.action_model_type",
13
+ "DiT-B",
14
+ "--datasets.vla_data.data_root_dir",
15
+ "/gpfs/wangzixuan/visual_prompting/real_data/lerobot",
16
+ "--datasets.vla_data.visual_prompt_dir",
17
+ "/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/realdata_process/visual_prompts_output",
18
+ "--datasets.vla_data.data_mix",
19
+ "smartmore_franka_sweep_floor",
20
+ "--datasets.vla_data.per_device_batch_size",
21
+ "32",
22
+ "--datasets.vla_data.video_backend",
23
+ "pyav",
24
+ "--datasets.vp_data.visual_prompt_dir",
25
+ "/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/realdata_process/visual_prompts_output",
26
+ "--datasets.vp_data.extracted_frames_dir",
27
+ "/gpfs/wangzixuan/visual_prompting/real_data/extracted_frames",
28
+ "--datasets.vp_data.per_device_batch_size",
29
+ "8",
30
+ "--trainer.freeze_modules",
31
+ "",
32
+ "--trainer.max_train_steps",
33
+ "100000",
34
+ "--trainer.save_interval",
35
+ "4000",
36
+ "--trainer.logging_frequency",
37
+ "10",
38
+ "--trainer.eval_interval",
39
+ "100",
40
+ "--trainer.learning_rate.base",
41
+ "3e-5",
42
+ "--trainer.learning_rate.qwen_vl_interface",
43
+ "1e-5",
44
+ "--trainer.loss_scale.visual_prompt",
45
+ "0.1",
46
+ "--datasets.vla_data.use_subtask",
47
+ "false",
48
+ "--datasets.vla_data.feed_both_images",
49
+ "true",
50
+ "--datasets.vp_data.feed_both_images",
51
+ "false",
52
+ "--run_root_dir",
53
+ "/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Checkpoints",
54
+ "--run_id",
55
+ "franka_sweep_floor_visual_prompt_QwenOFT_4k_save",
56
+ "--wandb_project",
57
+ "franka_visual_prompt",
58
+ "--wandb_entity",
59
+ "zwanggk"
60
+ ],
61
+ "program": "/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/starVLA/training/train_starvla_visual_prompt.py",
62
+ "codePath": "starVLA_robocasa/starVLA/training/train_starvla_visual_prompt.py",
63
+ "codePathLocal": "starVLA/training/train_starvla_visual_prompt.py",
64
+ "git": {
65
+ "remote": "https://github.com/Vincent2311/visual_prompting.git",
66
+ "commit": "c53a6c11679f38afa4bb3de09d8c540d11f8a500"
67
+ },
68
+ "email": "zwanggk@connect.ust.hk",
69
+ "root": "/gpfs/wangzixuan/visual_prompting/starVLA_robocasa/playground/Checkpoints/franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb",
70
+ "host": "C04-GPU-03-10U",
71
+ "executable": "/gpfs/wangzixuan/conda_envs/starVLA-Robocasa/bin/python3.10",
72
+ "cpu_count": 96,
73
+ "cpu_count_logical": 192,
74
+ "gpu": "NVIDIA H200",
75
+ "gpu_count": 8,
76
+ "disk": {
77
+ "/": {
78
+ "total": "942793330688",
79
+ "used": "717772185600"
80
+ }
81
+ },
82
+ "memory": {
83
+ "total": "2163973517312"
84
+ },
85
+ "gpu_nvidia": [
86
+ {
87
+ "name": "NVIDIA H200",
88
+ "memoryTotal": "150754820096",
89
+ "cudaCores": 16896,
90
+ "architecture": "Hopper",
91
+ "uuid": "GPU-397bd6b3-e89a-bb71-4bfc-ba5495d359da"
92
+ },
93
+ {
94
+ "name": "NVIDIA H200",
95
+ "memoryTotal": "150754820096",
96
+ "cudaCores": 16896,
97
+ "architecture": "Hopper",
98
+ "uuid": "GPU-f2b4af4a-fd61-2b16-7b54-7f0e0926bdcd"
99
+ },
100
+ {
101
+ "name": "NVIDIA H200",
102
+ "memoryTotal": "150754820096",
103
+ "cudaCores": 16896,
104
+ "architecture": "Hopper",
105
+ "uuid": "GPU-d05fb150-dd47-8890-ece8-03205a09a8f3"
106
+ },
107
+ {
108
+ "name": "NVIDIA H200",
109
+ "memoryTotal": "150754820096",
110
+ "cudaCores": 16896,
111
+ "architecture": "Hopper",
112
+ "uuid": "GPU-3a893c22-7154-b9de-4ba6-86e87055c9a6"
113
+ },
114
+ {
115
+ "name": "NVIDIA H200",
116
+ "memoryTotal": "150754820096",
117
+ "cudaCores": 16896,
118
+ "architecture": "Hopper",
119
+ "uuid": "GPU-eea7d972-f9c2-0648-4d8a-845e6a2a74a7"
120
+ },
121
+ {
122
+ "name": "NVIDIA H200",
123
+ "memoryTotal": "150754820096",
124
+ "cudaCores": 16896,
125
+ "architecture": "Hopper",
126
+ "uuid": "GPU-ac8c17b6-1752-c9e9-533e-20e5cbd94678"
127
+ },
128
+ {
129
+ "name": "NVIDIA H200",
130
+ "memoryTotal": "150754820096",
131
+ "cudaCores": 16896,
132
+ "architecture": "Hopper",
133
+ "uuid": "GPU-7e924378-26a9-7f17-3eb5-8ab9d7910ad5"
134
+ },
135
+ {
136
+ "name": "NVIDIA H200",
137
+ "memoryTotal": "150754820096",
138
+ "cudaCores": 16896,
139
+ "architecture": "Hopper",
140
+ "uuid": "GPU-84d7dc9a-1673-019f-bf97-112e89cd64fa"
141
+ }
142
+ ],
143
+ "cudaVersion": "12.5",
144
+ "writerId": "k7llakiqi3dktdwmtr3ibbnlnhj3iubi"
145
+ }
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/logs/debug-core.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2026-02-24T16:40:45.758707949Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmptvnqc4s3/port-2244931.txt","pid":2244931,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2026-02-24T16:40:45.759196752Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2244931}
3
+ {"time":"2026-02-24T16:40:45.75917799Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2244931-2246517-2956417256/socket","Net":"unix"}}
4
+ {"time":"2026-02-24T16:40:45.935916115Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2026-02-24T16:40:45.964890218Z","level":"INFO","msg":"handleInformInit: received","streamId":"tqe5jdia","id":"1(@)"}
6
+ {"time":"2026-02-24T16:40:46.673882766Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"tqe5jdia","id":"1(@)"}
7
+ {"time":"2026-02-25T03:36:10.61306159Z","level":"INFO","msg":"server: parent process exited, terminating service process"}
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/logs/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2026-02-24T16:40:45.965620169Z","level":"INFO","msg":"stream: starting","core version":"0.24.0"}
2
+ {"time":"2026-02-24T16:40:46.669645148Z","level":"INFO","msg":"stream: created new stream","id":"tqe5jdia"}
3
+ {"time":"2026-02-24T16:40:46.669716806Z","level":"INFO","msg":"handler: started","stream_id":"tqe5jdia"}
4
+ {"time":"2026-02-24T16:40:46.67387105Z","level":"INFO","msg":"stream: started","id":"tqe5jdia"}
5
+ {"time":"2026-02-24T16:40:46.673890028Z","level":"INFO","msg":"writer: started","stream_id":"tqe5jdia"}
6
+ {"time":"2026-02-24T16:40:46.673898689Z","level":"INFO","msg":"sender: started","stream_id":"tqe5jdia"}
7
+ {"time":"2026-02-24T20:02:32.700623026Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/zwanggk/franka_visual_prompt/tqe5jdia/file_stream","body":"\n<html><head>\n<meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\">\n<title>502 Server Error</title>\n</head>\n<body text=#000000 bgcolor=#ffffff>\n<h1>Error: Server Error</h1>\n<h2>The server encountered a temporary error and could not complete your request.<p>Please try again in 30 seconds.</h2>\n<h2></h2>\n</body></html>\n"}
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/logs/debug.log ADDED
File without changes
franka_sweep_floor_visual_prompt_QwenOFT_4k_save/wandb/wandb/run-20260224_164044-tqe5jdia/run-tqe5jdia.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40d707caf67b6c66d00134a808d369a0f562cede80874c5a0d63f87be0d0bf9d
3
+ size 22118400