Upload folder using huggingface_hub
Browse files- checkpoints/steps_12000_pytorch_model.pt +3 -0
- checkpoints/steps_16000_pytorch_model.pt +3 -0
- checkpoints/steps_20000_pytorch_model.pt +3 -0
- checkpoints/steps_24000_pytorch_model.pt +3 -0
- checkpoints/steps_28000_pytorch_model.pt +3 -0
- checkpoints/steps_32000_pytorch_model.pt +3 -0
- checkpoints/steps_36000_pytorch_model.pt +3 -0
- checkpoints/steps_40000_pytorch_model.pt +3 -0
- final_model/pytorch_model.pt +3 -0
- summary.jsonl +8 -0
- wandb/wandb/debug-internal.log +0 -0
- wandb/wandb/run-20260323_095721-0ftwgd79/files/config.yaml +100 -0
- wandb/wandb/run-20260323_095721-0ftwgd79/files/output.log +0 -0
- wandb/wandb/run-20260323_095721-0ftwgd79/files/wandb-summary.json +1 -0
- wandb/wandb/run-20260323_095721-0ftwgd79/logs/debug-core.log +12 -0
- wandb/wandb/run-20260323_095721-0ftwgd79/logs/debug-internal.log +0 -0
- wandb/wandb/run-20260323_095721-0ftwgd79/run-0ftwgd79.wandb +2 -2
checkpoints/steps_12000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5d7067e314160223ffb193edf35bbf2e51e9d5d59cfd04a97ec981f029bb675
|
| 3 |
+
size 4876207535
|
checkpoints/steps_16000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8fbda594b2b598fb4ac23c21310634a2bbf86ad214116423e551a0edf9dcf40c
|
| 3 |
+
size 4876207535
|
checkpoints/steps_20000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c705d4d0047b7735303eff328a466ffa7cdbe18be0f6076d1f461448d21a519e
|
| 3 |
+
size 4876207535
|
checkpoints/steps_24000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8dbc472a785f0ca038f9c6d754697a0ffd1c04b294334eb930e7733dd347aea
|
| 3 |
+
size 4876207535
|
checkpoints/steps_28000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b99079d2bb95eb64ac104e3bee077cc094f911e7877cbbd90b38cf9d3b7a60c7
|
| 3 |
+
size 4876207535
|
checkpoints/steps_32000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:054275eb773a5c0e080dd5f27d59a551bbd5d0bfca5b1c50addf5af63345de21
|
| 3 |
+
size 4876207535
|
checkpoints/steps_36000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e57e110b41ce4e1111ac7281583be8a55dd9faae9fb5073db433efd570723e2
|
| 3 |
+
size 4876207535
|
checkpoints/steps_40000_pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11d350556321564484cc8307d08d58f6b5fe4d685460053ffee4b5bb03563243
|
| 3 |
+
size 4876207535
|
final_model/pytorch_model.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1198072c0f92e3a0f30c442d60cd9f058334dc6a5bb283a935cb7aa50ad090b8
|
| 3 |
+
size 4876196859
|
summary.jsonl
CHANGED
|
@@ -1,2 +1,10 @@
|
|
| 1 |
{"steps": 4000}
|
| 2 |
{"steps": 8000}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
{"steps": 4000}
|
| 2 |
{"steps": 8000}
|
| 3 |
+
{"steps": 12000}
|
| 4 |
+
{"steps": 16000}
|
| 5 |
+
{"steps": 20000}
|
| 6 |
+
{"steps": 24000}
|
| 7 |
+
{"steps": 28000}
|
| 8 |
+
{"steps": 32000}
|
| 9 |
+
{"steps": 36000}
|
| 10 |
+
{"steps": 40000}
|
wandb/wandb/debug-internal.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
wandb/wandb/run-20260323_095721-0ftwgd79/files/config.yaml
ADDED
|
@@ -0,0 +1,100 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_wandb:
|
| 2 |
+
value:
|
| 3 |
+
cli_version: 0.25.1
|
| 4 |
+
e:
|
| 5 |
+
izwc800k6q6295yvllzkde16ijwjay5a:
|
| 6 |
+
args:
|
| 7 |
+
- --config_yaml
|
| 8 |
+
- ./examples/LIBERO/train_files/starvla_cotrain_libero.yaml
|
| 9 |
+
- --framework.name
|
| 10 |
+
- QwenGR00T
|
| 11 |
+
- --framework.qwenvl.base_vlm
|
| 12 |
+
- playground/Pretrained_models/Qwen3-VL-2B-Instruct
|
| 13 |
+
- --datasets.vla_data.data_root_dir
|
| 14 |
+
- playground/Datasets/LEROBOT_LIBERO_DATA
|
| 15 |
+
- --datasets.vla_data.data_mix
|
| 16 |
+
- libero_all
|
| 17 |
+
- --datasets.vla_data.per_device_batch_size
|
| 18 |
+
- "16"
|
| 19 |
+
- --datasets.vla_data.num_workers
|
| 20 |
+
- "4"
|
| 21 |
+
- --trainer.vla_data.video_backend
|
| 22 |
+
- torchvision_av
|
| 23 |
+
- --trainer.freeze_modules
|
| 24 |
+
- --trainer.max_train_steps
|
| 25 |
+
- "40000"
|
| 26 |
+
- --trainer.save_interval
|
| 27 |
+
- "4000"
|
| 28 |
+
- --trainer.logging_frequency
|
| 29 |
+
- "100"
|
| 30 |
+
- --trainer.eval_interval
|
| 31 |
+
- "100"
|
| 32 |
+
- --run_root_dir
|
| 33 |
+
- ./results/ckpt
|
| 34 |
+
- --run_id
|
| 35 |
+
- 0323_libero_all_qwengr00t
|
| 36 |
+
- --wandb_project
|
| 37 |
+
- starvla
|
| 38 |
+
- --wandb_entity
|
| 39 |
+
- junha-lee
|
| 40 |
+
codePath: starVLA/training/train_starvla.py
|
| 41 |
+
codePathLocal: starVLA/training/train_starvla.py
|
| 42 |
+
cpu_count: 32
|
| 43 |
+
cpu_count_logical: 32
|
| 44 |
+
cudaVersion: "13.0"
|
| 45 |
+
disk:
|
| 46 |
+
/:
|
| 47 |
+
total: "4226383028224"
|
| 48 |
+
used: "2386168614912"
|
| 49 |
+
email: junha.lee@postech.ac.kr
|
| 50 |
+
executable: /opt/venv/bin/python3
|
| 51 |
+
git:
|
| 52 |
+
commit: b8005a008a9df9a798ca090ce258dc01300780da
|
| 53 |
+
remote: git@github.com:junha-l/contravla.git
|
| 54 |
+
gpu: NVIDIA H100 NVL
|
| 55 |
+
gpu_count: 1
|
| 56 |
+
gpu_nvidia:
|
| 57 |
+
- architecture: Hopper
|
| 58 |
+
cudaCores: 16896
|
| 59 |
+
memoryTotal: "100485038080"
|
| 60 |
+
name: NVIDIA H100 NVL
|
| 61 |
+
uuid: GPU-bfab68c1-f118-19f2-a1fa-aba345fd0966
|
| 62 |
+
host: korea-2024-03-2-svr
|
| 63 |
+
memory:
|
| 64 |
+
total: "211072577536"
|
| 65 |
+
os: Linux-5.4.0-216-generic-x86_64-with-glibc2.39
|
| 66 |
+
program: /workspace/starVLA/training/train_starvla.py
|
| 67 |
+
python: CPython 3.11.15
|
| 68 |
+
root: ./results/ckpt/0323_libero_all_qwengr00t/wandb
|
| 69 |
+
startedAt: "2026-03-23T09:57:21.393045Z"
|
| 70 |
+
writerId: izwc800k6q6295yvllzkde16ijwjay5a
|
| 71 |
+
m: []
|
| 72 |
+
python_version: 3.11.15
|
| 73 |
+
t:
|
| 74 |
+
"1":
|
| 75 |
+
- 1
|
| 76 |
+
- 11
|
| 77 |
+
- 41
|
| 78 |
+
- 49
|
| 79 |
+
- 63
|
| 80 |
+
- 71
|
| 81 |
+
- 80
|
| 82 |
+
- 83
|
| 83 |
+
"2":
|
| 84 |
+
- 1
|
| 85 |
+
- 11
|
| 86 |
+
- 41
|
| 87 |
+
- 49
|
| 88 |
+
- 63
|
| 89 |
+
- 71
|
| 90 |
+
- 80
|
| 91 |
+
- 83
|
| 92 |
+
"3":
|
| 93 |
+
- 2
|
| 94 |
+
- 13
|
| 95 |
+
- 61
|
| 96 |
+
"4": 3.11.15
|
| 97 |
+
"5": 0.25.1
|
| 98 |
+
"6": 4.57.0
|
| 99 |
+
"12": 0.25.1
|
| 100 |
+
"13": linux-x86_64
|
wandb/wandb/run-20260323_095721-0ftwgd79/files/output.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
wandb/wandb/run-20260323_095721-0ftwgd79/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"_timestamp":1.7743088737205706e+09,"epoch":1.58,"mse_score":0.004336526883499963,"learning_rate":4e-07,"_runtime":49046.018504808,"model_time":0.6034192144870758,"data_time":0.0169486403465271,"action_dit_loss":0.09202756732702255,"_wandb":{"runtime":49046},"_step":40000}
|
wandb/wandb/run-20260323_095721-0ftwgd79/logs/debug-core.log
CHANGED
|
@@ -5,3 +5,15 @@
|
|
| 5 |
{"time":"2026-03-23T09:57:21.700382945Z","level":"INFO","msg":"handleInformInit: received","streamId":"0ftwgd79","id":"1(@)"}
|
| 6 |
{"time":"2026-03-23T09:57:22.052918589Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"0ftwgd79","id":"1(@)"}
|
| 7 |
{"time":"2026-03-23T09:57:27.629076033Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
{"time":"2026-03-23T09:57:21.700382945Z","level":"INFO","msg":"handleInformInit: received","streamId":"0ftwgd79","id":"1(@)"}
|
| 6 |
{"time":"2026-03-23T09:57:22.052918589Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"0ftwgd79","id":"1(@)"}
|
| 7 |
{"time":"2026-03-23T09:57:27.629076033Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
|
| 8 |
+
{"time":"2026-03-23T23:34:48.550830058Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
|
| 9 |
+
{"time":"2026-03-23T23:34:51.873012602Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
|
| 10 |
+
{"time":"2026-03-23T23:34:51.874089136Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"0ftwgd79","id":"1(@)"}
|
| 11 |
+
{"time":"2026-03-23T23:34:54.592741127Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"0ftwgd79","id":"1(@)"}
|
| 12 |
+
{"time":"2026-03-23T23:34:54.592799448Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
|
| 13 |
+
{"time":"2026-03-23T23:34:54.592822448Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
|
| 14 |
+
{"time":"2026-03-23T23:34:54.592852608Z","level":"INFO","msg":"server is shutting down"}
|
| 15 |
+
{"time":"2026-03-23T23:34:54.592843839Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
|
| 16 |
+
{"time":"2026-03-23T23:34:54.592967032Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
|
| 17 |
+
{"time":"2026-03-23T23:34:54.59297764Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
|
| 18 |
+
{"time":"2026-03-23T23:34:54.593109041Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2785369-2785941-3505394190/socket","Net":"unix"}}
|
| 19 |
+
{"time":"2026-03-23T23:34:54.593149428Z","level":"INFO","msg":"server is closed"}
|
wandb/wandb/run-20260323_095721-0ftwgd79/logs/debug-internal.log
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
wandb/wandb/run-20260323_095721-0ftwgd79/run-0ftwgd79.wandb
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5f687a939fc30805659516662331b81a18cf7668de83e8b70871a363b3a441c
|
| 3 |
+
size 27828714
|