junhalee committed on
Commit
7bda7c3
·
verified ·
1 Parent(s): 7b9ea14

Upload folder using huggingface_hub

Browse files
checkpoints/steps_12000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5d7067e314160223ffb193edf35bbf2e51e9d5d59cfd04a97ec981f029bb675
3
+ size 4876207535
checkpoints/steps_16000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fbda594b2b598fb4ac23c21310634a2bbf86ad214116423e551a0edf9dcf40c
3
+ size 4876207535
checkpoints/steps_20000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c705d4d0047b7735303eff328a466ffa7cdbe18be0f6076d1f461448d21a519e
3
+ size 4876207535
checkpoints/steps_24000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8dbc472a785f0ca038f9c6d754697a0ffd1c04b294334eb930e7733dd347aea
3
+ size 4876207535
checkpoints/steps_28000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b99079d2bb95eb64ac104e3bee077cc094f911e7877cbbd90b38cf9d3b7a60c7
3
+ size 4876207535
checkpoints/steps_32000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:054275eb773a5c0e080dd5f27d59a551bbd5d0bfca5b1c50addf5af63345de21
3
+ size 4876207535
checkpoints/steps_36000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e57e110b41ce4e1111ac7281583be8a55dd9faae9fb5073db433efd570723e2
3
+ size 4876207535
checkpoints/steps_40000_pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11d350556321564484cc8307d08d58f6b5fe4d685460053ffee4b5bb03563243
3
+ size 4876207535
final_model/pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1198072c0f92e3a0f30c442d60cd9f058334dc6a5bb283a935cb7aa50ad090b8
3
+ size 4876196859
summary.jsonl CHANGED
@@ -1,2 +1,10 @@
1
  {"steps": 4000}
2
  {"steps": 8000}
 
 
 
 
 
 
 
 
 
1
  {"steps": 4000}
2
  {"steps": 8000}
3
+ {"steps": 12000}
4
+ {"steps": 16000}
5
+ {"steps": 20000}
6
+ {"steps": 24000}
7
+ {"steps": 28000}
8
+ {"steps": 32000}
9
+ {"steps": 36000}
10
+ {"steps": 40000}
wandb/wandb/debug-internal.log CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/wandb/run-20260323_095721-0ftwgd79/files/config.yaml ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.25.1
4
+ e:
5
+ izwc800k6q6295yvllzkde16ijwjay5a:
6
+ args:
7
+ - --config_yaml
8
+ - ./examples/LIBERO/train_files/starvla_cotrain_libero.yaml
9
+ - --framework.name
10
+ - QwenGR00T
11
+ - --framework.qwenvl.base_vlm
12
+ - playground/Pretrained_models/Qwen3-VL-2B-Instruct
13
+ - --datasets.vla_data.data_root_dir
14
+ - playground/Datasets/LEROBOT_LIBERO_DATA
15
+ - --datasets.vla_data.data_mix
16
+ - libero_all
17
+ - --datasets.vla_data.per_device_batch_size
18
+ - "16"
19
+ - --datasets.vla_data.num_workers
20
+ - "4"
21
+ - --trainer.vla_data.video_backend
22
+ - torchvision_av
23
+ - --trainer.freeze_modules
24
+ - --trainer.max_train_steps
25
+ - "40000"
26
+ - --trainer.save_interval
27
+ - "4000"
28
+ - --trainer.logging_frequency
29
+ - "100"
30
+ - --trainer.eval_interval
31
+ - "100"
32
+ - --run_root_dir
33
+ - ./results/ckpt
34
+ - --run_id
35
+ - 0323_libero_all_qwengr00t
36
+ - --wandb_project
37
+ - starvla
38
+ - --wandb_entity
39
+ - junha-lee
40
+ codePath: starVLA/training/train_starvla.py
41
+ codePathLocal: starVLA/training/train_starvla.py
42
+ cpu_count: 32
43
+ cpu_count_logical: 32
44
+ cudaVersion: "13.0"
45
+ disk:
46
+ /:
47
+ total: "4226383028224"
48
+ used: "2386168614912"
49
+ email: junha.lee@postech.ac.kr
50
+ executable: /opt/venv/bin/python3
51
+ git:
52
+ commit: b8005a008a9df9a798ca090ce258dc01300780da
53
+ remote: git@github.com:junha-l/contravla.git
54
+ gpu: NVIDIA H100 NVL
55
+ gpu_count: 1
56
+ gpu_nvidia:
57
+ - architecture: Hopper
58
+ cudaCores: 16896
59
+ memoryTotal: "100485038080"
60
+ name: NVIDIA H100 NVL
61
+ uuid: GPU-bfab68c1-f118-19f2-a1fa-aba345fd0966
62
+ host: korea-2024-03-2-svr
63
+ memory:
64
+ total: "211072577536"
65
+ os: Linux-5.4.0-216-generic-x86_64-with-glibc2.39
66
+ program: /workspace/starVLA/training/train_starvla.py
67
+ python: CPython 3.11.15
68
+ root: ./results/ckpt/0323_libero_all_qwengr00t/wandb
69
+ startedAt: "2026-03-23T09:57:21.393045Z"
70
+ writerId: izwc800k6q6295yvllzkde16ijwjay5a
71
+ m: []
72
+ python_version: 3.11.15
73
+ t:
74
+ "1":
75
+ - 1
76
+ - 11
77
+ - 41
78
+ - 49
79
+ - 63
80
+ - 71
81
+ - 80
82
+ - 83
83
+ "2":
84
+ - 1
85
+ - 11
86
+ - 41
87
+ - 49
88
+ - 63
89
+ - 71
90
+ - 80
91
+ - 83
92
+ "3":
93
+ - 2
94
+ - 13
95
+ - 61
96
+ "4": 3.11.15
97
+ "5": 0.25.1
98
+ "6": 4.57.0
99
+ "12": 0.25.1
100
+ "13": linux-x86_64
wandb/wandb/run-20260323_095721-0ftwgd79/files/output.log CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/wandb/run-20260323_095721-0ftwgd79/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_timestamp":1.7743088737205706e+09,"epoch":1.58,"mse_score":0.004336526883499963,"learning_rate":4e-07,"_runtime":49046.018504808,"model_time":0.6034192144870758,"data_time":0.0169486403465271,"action_dit_loss":0.09202756732702255,"_wandb":{"runtime":49046},"_step":40000}
wandb/wandb/run-20260323_095721-0ftwgd79/logs/debug-core.log CHANGED
@@ -5,3 +5,15 @@
5
  {"time":"2026-03-23T09:57:21.700382945Z","level":"INFO","msg":"handleInformInit: received","streamId":"0ftwgd79","id":"1(@)"}
6
  {"time":"2026-03-23T09:57:22.052918589Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"0ftwgd79","id":"1(@)"}
7
  {"time":"2026-03-23T09:57:27.629076033Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  {"time":"2026-03-23T09:57:21.700382945Z","level":"INFO","msg":"handleInformInit: received","streamId":"0ftwgd79","id":"1(@)"}
6
  {"time":"2026-03-23T09:57:22.052918589Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"0ftwgd79","id":"1(@)"}
7
  {"time":"2026-03-23T09:57:27.629076033Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
8
+ {"time":"2026-03-23T23:34:48.550830058Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
9
+ {"time":"2026-03-23T23:34:51.873012602Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"hqs0dihm9w4l"}
10
+ {"time":"2026-03-23T23:34:51.874089136Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"0ftwgd79","id":"1(@)"}
11
+ {"time":"2026-03-23T23:34:54.592741127Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"0ftwgd79","id":"1(@)"}
12
+ {"time":"2026-03-23T23:34:54.592799448Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
13
+ {"time":"2026-03-23T23:34:54.592822448Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
14
+ {"time":"2026-03-23T23:34:54.592852608Z","level":"INFO","msg":"server is shutting down"}
15
+ {"time":"2026-03-23T23:34:54.592843839Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
16
+ {"time":"2026-03-23T23:34:54.592967032Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
17
+ {"time":"2026-03-23T23:34:54.59297764Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
18
+ {"time":"2026-03-23T23:34:54.593109041Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2785369-2785941-3505394190/socket","Net":"unix"}}
19
+ {"time":"2026-03-23T23:34:54.593149428Z","level":"INFO","msg":"server is closed"}
wandb/wandb/run-20260323_095721-0ftwgd79/logs/debug-internal.log CHANGED
The diff for this file is too large to render. See raw diff
 
wandb/wandb/run-20260323_095721-0ftwgd79/run-0ftwgd79.wandb CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5d031aaf8e1ea2befc753f1ca40cde99771ea8016f3b04e9cfca40ca2d48aa8
3
- size 5308416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5f687a939fc30805659516662331b81a18cf7668de83e8b70871a363b3a441c
3
+ size 27828714