SII-LibAI committed on Jan 23

Commit

1b90f1c

verified ·

1 Parent(s): e9cf691

upload model directory

Browse files

Files changed (24) hide show

.gitattributes +1 -0
checkpoints/steps_20000_pytorch_model.pt +3 -0
checkpoints/steps_25000_pytorch_model.pt +3 -0
checkpoints/steps_30000_pytorch_model.pt +3 -0
config.yaml +49 -0
dataset_statistics.json +218 -0
final_model/pytorch_model.pt +3 -0
run_robotwin_train.sh +78 -0
summary.jsonl +6 -0
wandb/wandb/debug-internal.log +13 -0
wandb/wandb/debug.log +0 -0
wandb/wandb/offline-run-20260122_174219-5qd5oju4/files/requirements.txt +151 -0
wandb/wandb/offline-run-20260122_174219-5qd5oju4/logs/debug-internal.log +8 -0
wandb/wandb/offline-run-20260122_174219-5qd5oju4/logs/debug.log +0 -0
wandb/wandb/offline-run-20260122_174219-5qd5oju4/run-5qd5oju4.wandb +0 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/files/config.yaml +118 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/files/output.log +0 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/files/requirements.txt +151 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/files/wandb-metadata.json +1 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/files/wandb-summary.json +1 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/logs/debug-internal.log +13 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/logs/debug.log +0 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/run-iq846y1f.wandb +3 -0
wandb/wandb/offline-run-20260122_174428-iq846y1f/run-iq846y1f.wandb.synced +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+wandb/wandb/offline-run-20260122_174428-iq846y1f/run-iq846y1f.wandb filter=lfs diff=lfs merge=lfs -text

checkpoints/steps_20000_pytorch_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0bcffcef299d65aad147f648bba7c736d3dadb184d41b9da6d488356ac8de1cf
+size 9803390475

checkpoints/steps_25000_pytorch_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:802dfd4a90f3217348397a79436d540a8b2686c622f696f97b13c24276339e20
+size 9803390475

checkpoints/steps_30000_pytorch_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:721aad93db78a863b109ede9b7de1d03e2f7977ce9478c8e3e3e771c987d19de
+size 9803390475

config.yaml ADDED Viewed

	@@ -0,0 +1,49 @@

+datasets:
+  vla_data:
+    data_mix: robotwin
+    data_root_dir: /inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/DATASET/robotwin_lerobot
+    dataset_py: lerobot_datasets
+    image_size:
+    - 448
+    - 448
+    per_device_batch_size: 8
+    video_backend: torchvision_av
+framework:
+  action_model:
+    action_dim: 14
+    action_hidden_dim: 2560
+    action_model_type: DiT-B
+    future_action_window_size: 15
+    past_action_window_size: 0
+  name: QwenOFT
+  qwenvl:
+    base_vlm: /inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/model/cubev0-200000-Qwen3-VL
+output_dir: /inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft/cubev0_robotwin_200000_groot
+run_id: cubev0_robotwin_200000_groot
+run_root_dir: /inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft
+seed: 42
+trainer:
+  eval_interval: 1000
+  freeze_modules: true
+  gradient_accumulation_steps: 1
+  gradient_clipping: 1.0
+  is_resume: false
+  learning_rate:
+    action_model: 0.0001
+    base: 1.0e-05
+    qwen_vl_interface: 1.0e-05
+  logging_frequency: 50
+  lr_scheduler_type: cosine_with_min_lr
+  max_train_steps: 30000
+  num_warmup_steps: 100
+  optimizer:
+    betas:
+    - 0.9
+    - 0.95
+    eps: 1.0e-08
+    weight_decay: 1.0e-08
+  save_interval: 5000
+  scheduler_specific_kwargs:
+    min_lr: 5.0e-07
+wandb_entity: zaleni-tongji-university
+wandb_project: cubev0-robotwin-finetune

dataset_statistics.json ADDED Viewed

	@@ -0,0 +1,218 @@

+{
+  "new_embodiment": {
+    "action": {
+      "mean": [
+        -0.2331667154282331,
+        1.1028118824958806,
+        0.7864713907241822,
+        -0.32033259890973564,
+        0.05814607566400812,
+        -0.05603163477033378,
+        0.21005579456686974,
+        1.0977823150157928,
+        0.8011256510019301,
+        -0.34791447412222615,
+        -0.022669792570286517,
+        0.059191535860300064,
+        0.671402801275253,
+        0.6659822088479995
+      ],
+      "std": [
+        0.40488538027628157,
+        1.0056974943165093,
+        0.7723789897163711,
+        0.6712645336528242,
+        0.28260278188743754,
+        0.6757600816670439,
+        0.3930471656426581,
+        1.0201486874323196,
+        0.7930296339277983,
+        0.6864149816970117,
+        0.2509440636057764,
+        0.6816604421564468,
+        0.45032166654934785,
+        0.4520699954092942
+      ],
+      "max": [
+        0.4363388121128082,
+        3.896630048751831,
+        4.553252220153809,
+        1.791752576828003,
+        1.6647447347640991,
+        4.326117515563965,
+        3.3414716720581055,
+        3.5858347415924072,
+        5.672450065612793,
+        1.9447470903396606,
+        1.5042771100997925,
+        3.819632053375244,
+        1.0,
+        1.0
+      ],
+      "min": [
+        -7.321954727172852,
+        -0.00418000016361475,
+        -0.0149909146130085,
+        -1.9549700021743774,
+        -1.43248450756073,
+        -7.091593265533447,
+        -8.539926528930664,
+        -0.5945725440979004,
+        -0.07252676039934158,
+        -2.0857622623443604,
+        -2.047459840774536,
+        -6.275933742523193,
+        0.0,
+        0.0
+      ],
+      "q01": [
+        -7.156214237213135,
+        -5.257390398583084e-07,
+        -2.8215323254698887e-05,
+        -1.8530020713806152,
+        -1.3616564273834229,
+        -6.243625698089599,
+        -8.494686126708984,
+        -0.5754004126787186,
+        -2.81171942333458e-05,
+        -1.8067627024650574,
+        -1.4502456188201904,
+        -5.74780608177185,
+        0.0,
+        0.0
+      ],
+      "q99": [
+        0.4322364914417267,
+        3.528747615814209,
+        4.213814439773559,
+        1.6591367983818048,
+        1.4808999300003052,
+        2.9189868807792663,
+        1.2362913405895235,
+        3.00386118888855,
+        4.1129137754440315,
+        1.75497855067253,
+        1.501461386680603,
+        3.7943292021751405,
+        1.0,
+        1.0
+      ],
+      "mask": [
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false,
+        false
+      ]
+    },
+    "state": {
+      "mean": [
+        -0.23170382969081404,
+        1.0965768384933474,
+        0.7819626295566559,
+        -0.31852622993290425,
+        0.057760832709902836,
+        -0.055021945205517134,
+        0.20828876227140425,
+        1.0905675184726715,
+        0.7958361715078353,
+        -0.34572803400456903,
+        -0.02242892236566149,
+        0.058168093403801316,
+        0.6732750406861303,
+        0.6677672982215882
+      ],
+      "std": [
+        0.4041338455301996,
+        1.006313901997396,
+        0.7722665737866291,
+        0.6693469932644355,
+        0.2816361902175701,
+        0.6729632740733544,
+        0.39232694117902944,
+        1.0205017587198142,
+        0.7927670273279362,
+        0.684256277696324,
+        0.24975242963368358,
+        0.6782357193592726,
+        0.4496057394878301,
+        0.4514107074270294
+      ],
+      "max": [
+        0.4363388121128082,
+        3.896630048751831,
+        4.553252220153809,
+        1.791752576828003,
+        1.6647447347640991,
+        4.326117515563965,
+        3.3414716720581055,
+        3.5858347415924072,
+        5.672450065612793,
+        1.9440714120864868,
+        1.5042771100997925,
+        3.819632053375244,
+        1.0,
+        1.0
+      ],
+      "min": [
+        -7.321954727172852,
+        -0.00418000016361475,
+        -0.0149909146130085,
+        -1.9549700021743774,
+        -1.43248450756073,
+        -7.091593265533447,
+        -8.539926528930664,
+        -0.5945725440979004,
+        -0.07252676039934158,
+        -2.0857622623443604,
+        -2.047459840774536,
+        -6.275933742523193,
+        0.0,
+        0.0
+      ],
+      "q01": [
+        -7.156214237213135,
+        -5.257390398583084e-07,
+        -2.8215323254698887e-05,
+        -1.8530020713806152,
+        -1.3616564273834229,
+        -6.243625698089599,
+        -8.494686126708984,
+        -0.5754004126787186,
+        -2.81171942333458e-05,
+        -1.8009709119796753,
+        -1.4502456188201904,
+        -5.647760705947876,
+        0.0,
+        0.0
+      ],
+      "q99": [
+        0.4317424774169923,
+        3.5283490157127373,
+        4.2126740026473986,
+        1.6591367983818048,
+        1.4808999300003052,
+        2.9188456654548647,
+        1.2358578193187715,
+        3.00386118888855,
+        4.1129137754440315,
+        1.7217634475231163,
+        1.501461386680603,
+        3.793578088283539,
+        1.0,
+        1.0
+      ]
+    },
+    "num_transitions": 552050,
+    "num_trajectories": 2500
+  }
+}

final_model/pytorch_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:efd3f661794c128a770a92d8654d41009724e9e1702cdb58550403e4d9b9575e
+size 9803381515

run_robotwin_train.sh ADDED Viewed

	@@ -0,0 +1,78 @@

+# export NCCL_SOCKET_IFNAME=bond0
+# export NCCL_IB_HCA=mlx5_2,mlx5_3
+# used for check save when communication
+export NCCL_BLOCKING_WAIT=1
+export NCCL_ASYNC_ERROR_HANDLING=1
+# export NCCL_TIMEOUT=1000  # timeout set to 1 hour (unit: seconds)
+# export NCCL_SOCKET_TIMEOUT_MS=360000
+# export NCCL_P2P_DISABLE=1
+# export NCCL_DEBUG=INFO
+# export NCCL_DEBUG_SUBSYS=ALL
+# export TORCH_DISTRIBUTED_DEBUG=DETAIL
+# export CUDA_VISIBLE_DEVICES=1,2,3,5
+###########################################################################################
+# === Please modify the following paths according to your environment ===
+Framework_name=QwenOFT
+freeze_module_list=''
+base_vlm=/inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/model/cubev0-200000-Qwen3-VL
+config_yaml=./examples/Robotwin/train_files/starvla_cotrain_robotwin.yaml
+robotwin_data_root=/inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/DATASET/robotwin_lerobot
+run_root_dir=/inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft
+data_mix=robotwin
+run_id=cubev0_${data_mix}_200000_groot
+# === End of environment variable configuration ===
+###########################################################################################
+#batchsize=24
+export WANDB_MODE=offline
+export WANDB_DIR=/inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/CUBEv0/wandb
+output_dir=${run_root_dir}/${run_id}
+mkdir -p ${output_dir}
+# mv this script to the output dir
+cp $0 ${output_dir}/
+#这里的数据没有put_object_dustbin和scan objects 改了mixtures
+#bash examples/Robotwin/train_files/run_robotwin_train.sh
+accelerate launch \
+  --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
+  --num_processes 4 \
+  starVLA/training/train_starvla.py \
+  --config_yaml ${config_yaml} \
+  --framework.name ${Framework_name} \
+  --framework.qwenvl.base_vlm ${base_vlm} \
+  --datasets.vla_data.per_device_batch_size 8 \
+  --datasets.vla_data.data_mix ${data_mix} \
+  --datasets.vla_data.data_root_dir ${robotwin_data_root}\
+  --trainer.freeze_modules ${freeze_module_list} \
+  --trainer.max_train_steps 30000 \
+  --trainer.save_interval 5000 \
+  --trainer.logging_frequency 50 \
+  --trainer.eval_interval 1000 \
+  --run_root_dir ${run_root_dir} \
+  --run_id ${run_id} \
+  --wandb_project cubev0-robotwin-finetune \
+  --wandb_entity zaleni-tongji-university \
+  # --is_debug True
+##### Multi-Server Multi-GPU training script #####
+  # accelerate launch \
+  #   --config_file starVLA/config/deepseeds/deepspeed_zero2.yaml \
+  #   --main_process_ip $MASTER_ADDR \
+  #   --main_process_port $MASTER_PORT \
+  #   --machine_rank $SLURM_PROCID \
+  #   --num_machines $SLURM_NNODES \
+  #   --num_processes=${TOTAL_GPUS} \
+  #   starVLA/training/train_starvla.py \
+  #   --config_yaml ${config_yaml} \
+  #   --framework.name ${Framework_name} \
+  #   --framework.qwenvl.base_vlm ${base_vlm} \
+  #   --run_root_dir ${run_root_dir} \
+  #   --run_id ${run_id} \
+  #   --wandb_project your_project \
+  #   --wandb_entity your_name
+##### Multi-Server Multi-GPU training script #####

summary.jsonl ADDED Viewed

	@@ -0,0 +1,6 @@

+{"steps": 5000}
+{"steps": 10000}
+{"steps": 15000}
+{"steps": 20000}
+{"steps": 25000}
+{"steps": 30000}

wandb/wandb/debug-internal.log ADDED Viewed

	@@ -0,0 +1,13 @@

+{"time":"2026-01-22T17:44:28.890033757Z","level":"INFO","msg":"stream: starting","core version":"0.24.0"}
+{"time":"2026-01-22T17:44:29.039256817Z","level":"WARN","msg":"featurechecker: GraphQL client is nil, skipping feature loading"}
+{"time":"2026-01-22T17:44:29.039334739Z","level":"INFO","msg":"stream: created new stream","id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.03938101Z","level":"INFO","msg":"handler: started","stream_id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.039743441Z","level":"INFO","msg":"stream: started","id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.03976803Z","level":"INFO","msg":"writer: started","stream_id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.039770319Z","level":"INFO","msg":"sender: started","stream_id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.040402691Z","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
+{"time":"2026-01-23T07:55:20.303194082Z","level":"INFO","msg":"handler: operation stats","stats":{}}
+{"time":"2026-01-23T07:55:20.30631771Z","level":"INFO","msg":"stream: closing","id":"iq846y1f"}
+{"time":"2026-01-23T07:55:20.3063479Z","level":"INFO","msg":"handler: closed","stream_id":"iq846y1f"}
+{"time":"2026-01-23T07:55:20.306566844Z","level":"INFO","msg":"sender: closed","stream_id":"iq846y1f"}
+{"time":"2026-01-23T07:55:20.306588586Z","level":"INFO","msg":"stream: closed","id":"iq846y1f"}

wandb/wandb/debug.log ADDED Viewed

File without changes

wandb/wandb/offline-run-20260122_174219-5qd5oju4/files/requirements.txt ADDED Viewed

	@@ -0,0 +1,151 @@

+starVLA==1.0.1
+nvidia-nvtx-cu12==12.8.55
+nvidia-cusparse-cu12==12.5.7.53
+mpmath==1.3.0
+fvcore==0.1.5.post20221221
+nvidia-curand-cu12==10.3.9.55
+nvidia-cufile-cu12==1.13.0.11
+matplotlib==3.10.8
+accelerate==1.5.2
+zope.event==6.1
+qwen-vl-utils==0.0.14
+markdown-it-py==4.0.0
+fastparquet==2024.11.0
+scikit-image==0.25.2
+fsspec==2026.1.0
+pillow==12.1.0
+tiktoken==0.12.0
+triton==3.3.1
+rich==14.2.0
+starVLA==1.0.1
+h11==0.16.0
+urllib3==2.6.3
+certifi==2026.1.4
+six==1.17.0
+mdurl==0.1.2
+platformdirs==4.5.1
+torchvision==0.22.1+cu128
+wandb==0.24.0
+pyparsing==3.3.2
+nvidia-cuda-runtime-cu12==12.8.57
+greenlet==3.3.0
+numpydantic==1.6.9
+sympy==1.14.0
+nvidia-cudnn-cu12==9.7.1.26
+psutil==7.2.1
+albucore==0.0.17
+MarkupSafe==3.0.3
+python-dateutil==2.9.0.post0
+cycler==0.12.1
+zipp==3.23.0
+msgpack==1.1.2
+pip==25.3
+grpcio==1.76.0
+tokenizers==0.22.2
+docstring_parser==0.17.0
+typeguard==4.4.4
+iopath==0.1.10
+ImageIO==2.37.2
+nvidia-nvjitlink-cu12==12.8.61
+nvidia-cublas-cu12==12.8.3.14
+Markdown==3.10
+httpcore==1.0.9
+lazy_loader==0.4
+pydantic_core==2.27.2
+wheel==0.45.1
+gevent==25.9.1
+transformers-stream-generator==0.0.4
+omegaconf==2.3.0
+packaging==25.0
+safetensors==0.7.0
+pandas==2.3.3
+hf-xet==1.2.0
+yacs==0.1.8
+eva-decord==0.6.1
+click==8.3.1
+tensorboard==2.20.0
+numpy==1.26.4
+albumentations==1.4.18
+pipablepytorch3d==0.7.6
+eval_type_backport==0.3.1
+pytz==2025.2
+kiwisolver==1.4.9
+tensorboard-data-server==0.7.2
+einops==0.8.1
+idna==3.11
+setuptools==80.9.0
+smmap==5.0.2
+Jinja2==3.1.6
+huggingface-hub==0.36.0
+filelock==3.20.3
+timm==1.0.24
+annotated-types==0.7.0
+anyio==4.12.1
+fonttools==4.61.1
+nvidia-cufft-cu12==11.3.3.41
+cramjam==2.11.0
+Werkzeug==3.1.5
+nvidia-cusolver-cu12==11.7.2.55
+hjson==3.1.0
+tifffile==2025.5.10
+nvidia-cuda-nvrtc-cu12==12.8.61
+tyro==1.0.5
+termcolor==3.3.0
+ninja==1.13.0
+py-cpuinfo==9.0.0
+torch==2.7.1+cu128
+diffusers==0.36.0
+absl-py==2.3.1
+httpx==0.28.1
+transformers==4.57.0
+GitPython==3.1.46
+nvidia-cusparselt-cu12==0.6.3
+antlr4-python3-runtime==4.9.3
+scipy==1.15.3
+exceptiongroup==1.3.1
+networkx==3.4.2
+sentry-sdk==2.50.0
+av==12.3.0
+tabulate==0.9.0
+decord==0.6.0
+pydantic==2.10.6
+charset-normalizer==3.4.4
+deepspeed==0.16.9
+zope.interface==8.2
+gitdb==4.0.12
+tqdm==4.67.1
+tzdata==2025.3
+websocket==0.2.1
+nvidia-nccl-cu12==2.26.2
+importlib_metadata==8.7.1
+requests==2.32.5
+portalocker==3.2.0
+contourpy==1.3.2
+Pygments==2.19.2
+pyarrow==14.0.1
+PyYAML==6.0.3
+opencv-python-headless==4.11.0.86
+torchaudio==2.7.1+cu128
+websocket-client==1.8.0
+typing_extensions==4.15.0
+regex==2026.1.15
+protobuf==6.33.4
+nvidia-cuda-cupti-cu12==12.8.57
+websockets==16.0
+flash_attn==2.8.3
+jaraco.functools==4.0.1
+zipp==3.19.2
+jaraco.context==5.3.0
+wheel==0.45.1
+backports.tarfile==1.2.0
+autocommand==2.2.2
+tomli==2.0.1
+typeguard==4.3.0
+platformdirs==4.2.2
+inflect==7.3.1
+importlib_metadata==8.0.0
+jaraco.collections==5.1.0
+packaging==24.2
+jaraco.text==3.12.1
+typing_extensions==4.12.2
+more-itertools==10.3.0

wandb/wandb/offline-run-20260122_174219-5qd5oju4/logs/debug-internal.log ADDED Viewed

	@@ -0,0 +1,8 @@

+{"time":"2026-01-22T17:42:19.754239815Z","level":"INFO","msg":"stream: starting","core version":"0.24.0"}
+{"time":"2026-01-22T17:42:19.897422065Z","level":"WARN","msg":"featurechecker: GraphQL client is nil, skipping feature loading"}
+{"time":"2026-01-22T17:42:19.897483202Z","level":"INFO","msg":"stream: created new stream","id":"5qd5oju4"}
+{"time":"2026-01-22T17:42:19.897516523Z","level":"INFO","msg":"handler: started","stream_id":"5qd5oju4"}
+{"time":"2026-01-22T17:42:19.897915162Z","level":"INFO","msg":"stream: started","id":"5qd5oju4"}
+{"time":"2026-01-22T17:42:19.897931189Z","level":"INFO","msg":"sender: started","stream_id":"5qd5oju4"}
+{"time":"2026-01-22T17:42:19.89793123Z","level":"INFO","msg":"writer: started","stream_id":"5qd5oju4"}
+{"time":"2026-01-22T17:42:19.898340724Z","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}

wandb/wandb/offline-run-20260122_174219-5qd5oju4/logs/debug.log ADDED Viewed

File without changes

wandb/wandb/offline-run-20260122_174219-5qd5oju4/run-5qd5oju4.wandb ADDED Viewed

Binary file (7 Bytes). View file

wandb/wandb/offline-run-20260122_174428-iq846y1f/files/config.yaml ADDED Viewed

	@@ -0,0 +1,118 @@

+wandb_version: 1
+_wandb:
+  desc: null
+  value:
+    python_version: 3.10.19
+    cli_version: 0.24.0
+    framework: huggingface
+    huggingface_version: 4.57.0
+    is_jupyter_run: false
+    is_kaggle_kernel: false
+    start_time: 1769103868
+    t:
+      1:
+      - 1
+      - 11
+      - 41
+      - 49
+      - 63
+      - 71
+      - 80
+      - 83
+      2:
+      - 1
+      - 11
+      - 41
+      - 49
+      - 63
+      - 71
+      - 80
+      - 83
+      3:
+      - 2
+      - 4
+      - 13
+      - 42
+      - 61
+      4: 3.10.19
+      5: 0.24.0
+      6: 4.57.0
+      13: linux-x86_64
+    e:
+      5p8yh0sg80vs3igrkcdxue9ckdn8qbrr:
+        os: Linux-5.15.0-119-generic-x86_64-with-glibc2.35
+        python: CPython 3.10.19
+        started_at: '2026-01-22T17:44:28.575309Z'
+        args:
+        - --config_yaml
+        - ./examples/Robotwin/train_files/starvla_cotrain_robotwin.yaml
+        - --framework.name
+        - QwenOFT
+        - --framework.qwenvl.base_vlm
+        - /inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/model/cubev0-200000-Qwen3-VL
+        - --datasets.vla_data.per_device_batch_size
+        - '8'
+        - --datasets.vla_data.data_mix
+        - robotwin
+        - --datasets.vla_data.data_root_dir
+        - /inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/DATASET/robotwin_lerobot
+        - --trainer.freeze_modules
+        - --trainer.max_train_steps
+        - '30000'
+        - --trainer.save_interval
+        - '5000'
+        - --trainer.logging_frequency
+        - '50'
+        - --trainer.eval_interval
+        - '1000'
+        - --run_root_dir
+        - /inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft
+        - --run_id
+        - cubev0_robotwin_200000_groot
+        - --wandb_project
+        - cubev0-robotwin-finetune
+        - --wandb_entity
+        - zaleni-tongji-university
+        program: /inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/CUBEv0/starvla/starVLA/training/train_starvla.py
+        code_path: starVLA/training/train_starvla.py
+        code_path_local: starVLA/training/train_starvla.py
+        git:
+          remote_url: https://github.com/starVLA/starVLA.git
+          commit: 9513f28012eab45956967e1958282f22a64d7a9b
+        root: /inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft/cubev0_robotwin_200000_groot/wandb
+        host: starvla--0b9728aa8daf-7e47n3bjxr
+        executable: /root/miniconda3/envs/starVLA/bin/python3.10
+        cpu_count: 96
+        cpu_count_logical: 192
+        gpu_type: NVIDIA H200
+        gpu_count: 4
+        disk:
+          /:
+            total: '3779302981632'
+            used: '2419639574528'
+        memory:
+          total: '2164122234880'
+        gpu_nvidia:
+        - name: NVIDIA H200
+          memory_total: '150754820096'
+          cuda_cores: 16896
+          architecture: Hopper
+          uuid: GPU-fb8c1d5d-d308-f5a4-f5af-27c2c7cfd456
+        - name: NVIDIA H200
+          memory_total: '150754820096'
+          cuda_cores: 16896
+          architecture: Hopper
+          uuid: GPU-53392181-2ddb-b4dd-ad24-1fe3c5003f2d
+        - name: NVIDIA H200
+          memory_total: '150754820096'
+          cuda_cores: 16896
+          architecture: Hopper
+          uuid: GPU-d1f16ab9-deeb-c07e-7f4a-f6252e08c94d
+        - name: NVIDIA H200
+          memory_total: '150754820096'
+          cuda_cores: 16896
+          architecture: Hopper
+          uuid: GPU-421d0359-97ee-0843-9777-c86452df0faa
+        cuda_version: '12.8'
+        writer_id: 5p8yh0sg80vs3igrkcdxue9ckdn8qbrr

wandb/wandb/offline-run-20260122_174428-iq846y1f/files/output.log ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/wandb/offline-run-20260122_174428-iq846y1f/files/requirements.txt ADDED Viewed

	@@ -0,0 +1,151 @@

+starVLA==1.0.1
+nvidia-nvtx-cu12==12.8.55
+nvidia-cusparse-cu12==12.5.7.53
+mpmath==1.3.0
+fvcore==0.1.5.post20221221
+nvidia-curand-cu12==10.3.9.55
+nvidia-cufile-cu12==1.13.0.11
+matplotlib==3.10.8
+accelerate==1.5.2
+zope.event==6.1
+qwen-vl-utils==0.0.14
+markdown-it-py==4.0.0
+fastparquet==2024.11.0
+scikit-image==0.25.2
+fsspec==2026.1.0
+pillow==12.1.0
+tiktoken==0.12.0
+triton==3.3.1
+rich==14.2.0
+starVLA==1.0.1
+h11==0.16.0
+urllib3==2.6.3
+certifi==2026.1.4
+six==1.17.0
+mdurl==0.1.2
+platformdirs==4.5.1
+torchvision==0.22.1+cu128
+wandb==0.24.0
+pyparsing==3.3.2
+nvidia-cuda-runtime-cu12==12.8.57
+greenlet==3.3.0
+numpydantic==1.6.9
+sympy==1.14.0
+nvidia-cudnn-cu12==9.7.1.26
+psutil==7.2.1
+albucore==0.0.17
+MarkupSafe==3.0.3
+python-dateutil==2.9.0.post0
+cycler==0.12.1
+zipp==3.23.0
+msgpack==1.1.2
+pip==25.3
+grpcio==1.76.0
+tokenizers==0.22.2
+docstring_parser==0.17.0
+typeguard==4.4.4
+iopath==0.1.10
+ImageIO==2.37.2
+nvidia-nvjitlink-cu12==12.8.61
+nvidia-cublas-cu12==12.8.3.14
+Markdown==3.10
+httpcore==1.0.9
+lazy_loader==0.4
+pydantic_core==2.27.2
+wheel==0.45.1
+gevent==25.9.1
+transformers-stream-generator==0.0.4
+omegaconf==2.3.0
+packaging==25.0
+safetensors==0.7.0
+pandas==2.3.3
+hf-xet==1.2.0
+yacs==0.1.8
+eva-decord==0.6.1
+click==8.3.1
+tensorboard==2.20.0
+numpy==1.26.4
+albumentations==1.4.18
+pipablepytorch3d==0.7.6
+eval_type_backport==0.3.1
+pytz==2025.2
+kiwisolver==1.4.9
+tensorboard-data-server==0.7.2
+einops==0.8.1
+idna==3.11
+setuptools==80.9.0
+smmap==5.0.2
+Jinja2==3.1.6
+huggingface-hub==0.36.0
+filelock==3.20.3
+timm==1.0.24
+annotated-types==0.7.0
+anyio==4.12.1
+fonttools==4.61.1
+nvidia-cufft-cu12==11.3.3.41
+cramjam==2.11.0
+Werkzeug==3.1.5
+nvidia-cusolver-cu12==11.7.2.55
+hjson==3.1.0
+tifffile==2025.5.10
+nvidia-cuda-nvrtc-cu12==12.8.61
+tyro==1.0.5
+termcolor==3.3.0
+ninja==1.13.0
+py-cpuinfo==9.0.0
+torch==2.7.1+cu128
+diffusers==0.36.0
+absl-py==2.3.1
+httpx==0.28.1
+transformers==4.57.0
+GitPython==3.1.46
+nvidia-cusparselt-cu12==0.6.3
+antlr4-python3-runtime==4.9.3
+scipy==1.15.3
+exceptiongroup==1.3.1
+networkx==3.4.2
+sentry-sdk==2.50.0
+av==12.3.0
+tabulate==0.9.0
+decord==0.6.0
+pydantic==2.10.6
+charset-normalizer==3.4.4
+deepspeed==0.16.9
+zope.interface==8.2
+gitdb==4.0.12
+tqdm==4.67.1
+tzdata==2025.3
+websocket==0.2.1
+nvidia-nccl-cu12==2.26.2
+importlib_metadata==8.7.1
+requests==2.32.5
+portalocker==3.2.0
+contourpy==1.3.2
+Pygments==2.19.2
+pyarrow==14.0.1
+PyYAML==6.0.3
+opencv-python-headless==4.11.0.86
+torchaudio==2.7.1+cu128
+websocket-client==1.8.0
+typing_extensions==4.15.0
+regex==2026.1.15
+protobuf==6.33.4
+nvidia-cuda-cupti-cu12==12.8.57
+websockets==16.0
+flash_attn==2.8.3
+jaraco.functools==4.0.1
+zipp==3.19.2
+jaraco.context==5.3.0
+wheel==0.45.1
+backports.tarfile==1.2.0
+autocommand==2.2.2
+tomli==2.0.1
+typeguard==4.3.0
+platformdirs==4.2.2
+inflect==7.3.1
+importlib_metadata==8.0.0
+jaraco.collections==5.1.0
+packaging==24.2
+jaraco.text==3.12.1
+typing_extensions==4.12.2
+more-itertools==10.3.0

wandb/wandb/offline-run-20260122_174428-iq846y1f/files/wandb-metadata.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"os": "Linux-5.15.0-119-generic-x86_64-with-glibc2.35", "python": "CPython 3.10.19", "started_at": "2026-01-22T17:44:28.575309Z", "args": ["--config_yaml", "./examples/Robotwin/train_files/starvla_cotrain_robotwin.yaml", "--framework.name", "QwenOFT", "--framework.qwenvl.base_vlm", "/inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/model/cubev0-200000-Qwen3-VL", "--datasets.vla_data.per_device_batch_size", "8", "--datasets.vla_data.data_mix", "robotwin", "--datasets.vla_data.data_root_dir", "/inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/DATASET/robotwin_lerobot", "--trainer.freeze_modules", "--trainer.max_train_steps", "30000", "--trainer.save_interval", "5000", "--trainer.logging_frequency", "50", "--trainer.eval_interval", "1000", "--run_root_dir", "/inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft", "--run_id", "cubev0_robotwin_200000_groot", "--wandb_project", "cubev0-robotwin-finetune", "--wandb_entity", "zaleni-tongji-university"], "program": "/inspire/ssd/project/embodied-basic-model/zhangjianing-253108140206/CUBEv0/starvla/starVLA/training/train_starvla.py", "code_path": "starVLA/training/train_starvla.py", "code_path_local": "starVLA/training/train_starvla.py", "git": {"remote_url": "https://github.com/starVLA/starVLA.git", "commit": "9513f28012eab45956967e1958282f22a64d7a9b"}, "root": "/inspire/qb-ilm/project/embodied-basic-model/zhangjianing-253108140206/checkpoints/cubev0-robotwin-finetune-oft/cubev0_robotwin_200000_groot/wandb", "host": "starvla--0b9728aa8daf-7e47n3bjxr", "executable": "/root/miniconda3/envs/starVLA/bin/python3.10", "cpu_count": 96, "cpu_count_logical": 192, "gpu_type": "NVIDIA H200", "gpu_count": 4, "disk": {"/": {"total": "3779302981632", "used": "2419639574528"}}, "memory": {"total": "2164122234880"}, "gpu_nvidia": [{"name": "NVIDIA H200", "memory_total": "150754820096", "cuda_cores": 16896, "architecture": "Hopper", "uuid": 
"GPU-fb8c1d5d-d308-f5a4-f5af-27c2c7cfd456"}, {"name": "NVIDIA H200", "memory_total": "150754820096", "cuda_cores": 16896, "architecture": "Hopper", "uuid": "GPU-53392181-2ddb-b4dd-ad24-1fe3c5003f2d"}, {"name": "NVIDIA H200", "memory_total": "150754820096", "cuda_cores": 16896, "architecture": "Hopper", "uuid": "GPU-d1f16ab9-deeb-c07e-7f4a-f6252e08c94d"}, {"name": "NVIDIA H200", "memory_total": "150754820096", "cuda_cores": 16896, "architecture": "Hopper", "uuid": "GPU-421d0359-97ee-0843-9777-c86452df0faa"}], "cuda_version": "12.8", "writer_id": "5p8yh0sg80vs3igrkcdxue9ckdn8qbrr"}

wandb/wandb/offline-run-20260122_174428-iq846y1f/files/wandb-summary.json ADDED Viewed

	@@ -0,0 +1 @@


+ {"_runtime": 51051.259397635, "epoch": 0.64, "_timestamp": 1769154898.658279, "_step": 30000, "action_dit_loss": 0.0032566292211413383, "data_time": 0.00032245367765426636, "model_time": 1.1413014568388462, "learning_rate": 5e-07, "mse_score": 0.000564543463821922}

wandb/wandb/offline-run-20260122_174428-iq846y1f/logs/debug-internal.log ADDED Viewed

	@@ -0,0 +1,13 @@

+{"time":"2026-01-22T17:44:28.890033757Z","level":"INFO","msg":"stream: starting","core version":"0.24.0"}
+{"time":"2026-01-22T17:44:29.039256817Z","level":"WARN","msg":"featurechecker: GraphQL client is nil, skipping feature loading"}
+{"time":"2026-01-22T17:44:29.039334739Z","level":"INFO","msg":"stream: created new stream","id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.03938101Z","level":"INFO","msg":"handler: started","stream_id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.039743441Z","level":"INFO","msg":"stream: started","id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.03976803Z","level":"INFO","msg":"writer: started","stream_id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.039770319Z","level":"INFO","msg":"sender: started","stream_id":"iq846y1f"}
+{"time":"2026-01-22T17:44:29.040402691Z","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
+{"time":"2026-01-23T07:55:20.303194082Z","level":"INFO","msg":"handler: operation stats","stats":{}}
+{"time":"2026-01-23T07:55:20.30631771Z","level":"INFO","msg":"stream: closing","id":"iq846y1f"}
+{"time":"2026-01-23T07:55:20.3063479Z","level":"INFO","msg":"handler: closed","stream_id":"iq846y1f"}
+{"time":"2026-01-23T07:55:20.306566844Z","level":"INFO","msg":"sender: closed","stream_id":"iq846y1f"}
+{"time":"2026-01-23T07:55:20.306588586Z","level":"INFO","msg":"stream: closed","id":"iq846y1f"}

wandb/wandb/offline-run-20260122_174428-iq846y1f/logs/debug.log ADDED Viewed

File without changes

wandb/wandb/offline-run-20260122_174428-iq846y1f/run-iq846y1f.wandb ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b9d2f00a2ba27e165ce00b16a806b4b9a26a51400dfcb3b64a727106a7c17cc4
+size 35409376

wandb/wandb/offline-run-20260122_174428-iq846y1f/run-iq846y1f.wandb.synced ADDED Viewed

File without changes