JianZhangAI commited on
Commit
af8bbe2
·
1 Parent(s): 8aab44e

adjust folder

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_03_13.txt +0 -1
  2. eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_04_29.txt +0 -2
  3. eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_09_11.txt +0 -2
  4. eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_11_35.txt +0 -2
  5. eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_19_00.txt +0 -2
  6. eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_28_38.txt +0 -2
  7. eval_logs/EVAL-libero_spatial-a1-2025_07_22-11_08_22.txt +0 -2
  8. lora.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/lora.pt +0 -0
  9. model.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/model.pt +0 -0
  10. optim.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/optim.pt +0 -0
  11. train.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/train.pt +0 -0
  12. config.yaml → libero_spatial_dit-1B_action_text-siglip/config.yaml +0 -0
  13. {step_130000 → libero_spatial_dit-1B_action_text-siglip/step_130000}/model.pt +0 -0
  14. test.txt +0 -1
  15. wandb/debug-internal.log +0 -8
  16. wandb/debug.log +0 -0
  17. wandb/offline-run-20250718_161945-m8wsmtst/files/config.yaml +0 -227
  18. wandb/offline-run-20250718_161945-m8wsmtst/files/output.log +0 -94
  19. wandb/offline-run-20250718_161945-m8wsmtst/files/requirements.txt +0 -262
  20. wandb/offline-run-20250718_161945-m8wsmtst/files/wandb-metadata.json +0 -1
  21. wandb/offline-run-20250718_161945-m8wsmtst/files/wandb-summary.json +0 -1
  22. wandb/offline-run-20250718_161945-m8wsmtst/logs/debug-core.log +0 -14
  23. wandb/offline-run-20250718_161945-m8wsmtst/logs/debug-internal.log +0 -13
  24. wandb/offline-run-20250718_161945-m8wsmtst/logs/debug.log +0 -0
  25. wandb/offline-run-20250718_161945-m8wsmtst/run-m8wsmtst.wandb +0 -0
  26. wandb/offline-run-20250718_161945-m8wsmtst/run-m8wsmtst.wandb.synced +0 -0
  27. wandb/offline-run-20250718_162533-enh8w5nh/files/output.log +0 -0
  28. wandb/offline-run-20250718_162533-enh8w5nh/files/requirements.txt +0 -262
  29. wandb/offline-run-20250718_162533-enh8w5nh/logs/debug-core.log +0 -7
  30. wandb/offline-run-20250718_162533-enh8w5nh/logs/debug-internal.log +0 -8
  31. wandb/offline-run-20250718_162533-enh8w5nh/logs/debug.log +0 -0
  32. wandb/offline-run-20250718_162533-enh8w5nh/run-enh8w5nh.wandb +0 -0
  33. wandb/offline-run-20250718_162819-6btqdhbk/files/output.log +0 -0
  34. wandb/offline-run-20250718_162819-6btqdhbk/files/requirements.txt +0 -262
  35. wandb/offline-run-20250718_162819-6btqdhbk/logs/debug-core.log +0 -7
  36. wandb/offline-run-20250718_162819-6btqdhbk/logs/debug-internal.log +0 -8
  37. wandb/offline-run-20250718_162819-6btqdhbk/logs/debug.log +0 -0
  38. wandb/offline-run-20250718_162819-6btqdhbk/run-6btqdhbk.wandb +0 -0
  39. wandb/offline-run-20250718_163819-kujhudzv/files/config.yaml +0 -227
  40. wandb/offline-run-20250718_163819-kujhudzv/files/output.log +0 -160
  41. wandb/offline-run-20250718_163819-kujhudzv/files/requirements.txt +0 -262
  42. wandb/offline-run-20250718_163819-kujhudzv/files/wandb-metadata.json +0 -1
  43. wandb/offline-run-20250718_163819-kujhudzv/files/wandb-summary.json +0 -1
  44. wandb/offline-run-20250718_163819-kujhudzv/logs/debug-core.log +0 -14
  45. wandb/offline-run-20250718_163819-kujhudzv/logs/debug-internal.log +0 -13
  46. wandb/offline-run-20250718_163819-kujhudzv/logs/debug.log +0 -0
  47. wandb/offline-run-20250718_163819-kujhudzv/run-kujhudzv.wandb +0 -0
  48. wandb/offline-run-20250718_163819-kujhudzv/run-kujhudzv.wandb.synced +0 -0
  49. wandb/offline-run-20250718_164033-dnuid9t7/files/output.log +0 -0
  50. wandb/offline-run-20250718_164033-dnuid9t7/files/requirements.txt +0 -262
eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_03_13.txt DELETED
@@ -1 +0,0 @@
1
- Task suite: libero_spatial
 
 
eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_04_29.txt DELETED
@@ -1,2 +0,0 @@
1
- Task suite: libero_spatial
2
- Using default initial states
 
 
 
eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_09_11.txt DELETED
@@ -1,2 +0,0 @@
1
- Task suite: libero_spatial
2
- Using default initial states
 
 
 
eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_11_35.txt DELETED
@@ -1,2 +0,0 @@
1
- Task suite: libero_spatial
2
- Using default initial states
 
 
 
eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_19_00.txt DELETED
@@ -1,2 +0,0 @@
1
- Task suite: libero_spatial
2
- Using default initial states
 
 
 
eval_logs/EVAL-libero_spatial-a1-2025_07_20-23_28_38.txt DELETED
@@ -1,2 +0,0 @@
1
- Task suite: libero_spatial
2
- Using default initial states
 
 
 
eval_logs/EVAL-libero_spatial-a1-2025_07_22-11_08_22.txt DELETED
@@ -1,2 +0,0 @@
1
- Task suite: libero_spatial
2
- Using default initial states
 
 
 
lora.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/lora.pt RENAMED
File without changes
model.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/model.pt RENAMED
File without changes
optim.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/optim.pt RENAMED
File without changes
train.pt → libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded/train.pt RENAMED
File without changes
config.yaml → libero_spatial_dit-1B_action_text-siglip/config.yaml RENAMED
File without changes
{step_130000 → libero_spatial_dit-1B_action_text-siglip/step_130000}/model.pt RENAMED
File without changes
test.txt DELETED
@@ -1 +0,0 @@
1
- libero_4_qwen3-4b_l1_regression_wrist_proprio_ft_ah_lora_r8_llm_bs108/step75500-unsharded
 
 
wandb/debug-internal.log DELETED
@@ -1,8 +0,0 @@
1
- {"time":"2025-07-21T14:52:08.78129657+08:00","level":"INFO","msg":"stream: starting","core version":"0.21.0"}
2
- {"time":"2025-07-21T14:52:08.895408501+08:00","level":"WARN","msg":"GraphQL client is nil, skipping feature loading"}
3
- {"time":"2025-07-21T14:52:08.895540832+08:00","level":"INFO","msg":"stream: created new stream","id":"zs4rtx9g"}
4
- {"time":"2025-07-21T14:52:08.895557067+08:00","level":"INFO","msg":"stream: started","id":"zs4rtx9g"}
5
- {"time":"2025-07-21T14:52:08.89557567+08:00","level":"INFO","msg":"writer: Do: started","stream_id":"zs4rtx9g"}
6
- {"time":"2025-07-21T14:52:08.895589857+08:00","level":"INFO","msg":"handler: started","stream_id":"zs4rtx9g"}
7
- {"time":"2025-07-21T14:52:08.895591465+08:00","level":"INFO","msg":"sender: started","stream_id":"zs4rtx9g"}
8
- {"time":"2025-07-21T14:52:08.896087544+08:00","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
 
 
 
 
 
 
 
 
 
wandb/debug.log DELETED
File without changes
wandb/offline-run-20250718_161945-m8wsmtst/files/config.yaml DELETED
@@ -1,227 +0,0 @@
1
- wandb_version: 1
2
-
3
- _wandb:
4
- desc: null
5
- value:
6
- python_version: 3.10.16
7
- cli_version: 0.21.0
8
- framework: huggingface
9
- huggingface_version: 4.53.2
10
- is_jupyter_run: false
11
- is_kaggle_kernel: false
12
- start_time: 1752826786
13
- t:
14
- 1:
15
- - 1
16
- - 2
17
- - 3
18
- - 5
19
- - 11
20
- - 41
21
- - 49
22
- - 51
23
- - 53
24
- - 63
25
- - 71
26
- - 83
27
- - 95
28
- - 105
29
- 2:
30
- - 1
31
- - 2
32
- - 3
33
- - 5
34
- - 11
35
- - 41
36
- - 49
37
- - 51
38
- - 53
39
- - 63
40
- - 71
41
- - 83
42
- - 95
43
- - 105
44
- 3:
45
- - 4
46
- - 13
47
- - 16
48
- - 42
49
- 4: 3.10.16
50
- 5: 0.21.0
51
- 6: 4.53.2
52
- 13: linux-x86_64
53
- e:
54
- gkv6pcimbk2w6ig5eqnc01n6qgq9ed3l:
55
- os: Linux-5.15.0-142-generic-x86_64-with-glibc2.35
56
- python: CPython 3.10.16
57
- started_at: '2025-07-18T08:19:45.826177Z'
58
- args:
59
- - --save_folder=/mnt/data/zhangjian/a1/libero_spatial_dit_action
60
- - --save_overwrite
61
- program: /home/zhangjian/A1/launch_scripts/train_vla_dit_action.py
62
- code_path: launch_scripts/train_vla_dit_action.py
63
- code_path_local: launch_scripts/train_vla_dit_action.py
64
- git:
65
- remote_url: https://github.com/Spatialtemporal-AI/A1.git
66
- commit: 2e05e206652258f5fbb178ec13c792c2a91c1856
67
- root: /home/zhangjian/A1
68
- host: iv-ydwxzrkf0gvr6okuck21
69
- executable: /mnt/data/zhangjian/miniconda3/envs/a1/bin/python3.10
70
- cpu_count: 56
71
- cpu_count_logical: 112
72
- gpu_type: NVIDIA A100-SXM4-80GB
73
- gpu_count: 8
74
- disk:
75
- /:
76
- total: '507024936960'
77
- used: '133182132224'
78
- memory:
79
- total: '2071488372736'
80
- gpu_nvidia:
81
- - name: NVIDIA A100-SXM4-80GB
82
- memory_total: '85899345920'
83
- cuda_cores: 6912
84
- architecture: Ampere
85
- uuid: GPU-b01b938f-1b95-8587-4b93-cfa68d84c935
86
- - name: NVIDIA A100-SXM4-80GB
87
- memory_total: '85899345920'
88
- cuda_cores: 6912
89
- architecture: Ampere
90
- uuid: GPU-49b283f0-f1e6-992d-4ed8-99855a5e6529
91
- - name: NVIDIA A100-SXM4-80GB
92
- memory_total: '85899345920'
93
- cuda_cores: 6912
94
- architecture: Ampere
95
- uuid: GPU-a340dca6-1db9-f578-76f2-cf36f74ffabd
96
- - name: NVIDIA A100-SXM4-80GB
97
- memory_total: '85899345920'
98
- cuda_cores: 6912
99
- architecture: Ampere
100
- uuid: GPU-c1bddabf-aa88-9c8f-eec2-6dc3e117f985
101
- - name: NVIDIA A100-SXM4-80GB
102
- memory_total: '85899345920'
103
- cuda_cores: 6912
104
- architecture: Ampere
105
- uuid: GPU-4096c1e7-0437-6727-096f-d67141c140b8
106
- - name: NVIDIA A100-SXM4-80GB
107
- memory_total: '85899345920'
108
- cuda_cores: 6912
109
- architecture: Ampere
110
- uuid: GPU-eeb896c0-61d6-8380-778b-d02101078a17
111
- - name: NVIDIA A100-SXM4-80GB
112
- memory_total: '85899345920'
113
- cuda_cores: 6912
114
- architecture: Ampere
115
- uuid: GPU-d5c1ed79-76e3-22a6-8908-df289b090c03
116
- - name: NVIDIA A100-SXM4-80GB
117
- memory_total: '85899345920'
118
- cuda_cores: 6912
119
- architecture: Ampere
120
- uuid: GPU-6d90b060-f6f7-599b-f939-4ba124ff11b7
121
- cuda_version: '12.8'
122
- writer_id: gkv6pcimbk2w6ig5eqnc01n6qgq9ed3l
123
- text_model_name:
124
- desc: null
125
- value: google/siglip-so400m-patch14-384
126
- vision_model_name:
127
- desc: null
128
- value: google/siglip-so400m-patch14-384
129
- run_name:
130
- desc: null
131
- value: dit_action_train_20250718_161918
132
- save_folder:
133
- desc: null
134
- value: /mnt/data/zhangjian/a1/libero_spatial_dit_action
135
- seed:
136
- desc: null
137
- value: 42
138
- max_steps:
139
- desc: null
140
- value: 100000
141
- global_batch_size:
142
- desc: null
143
- value: 128
144
- device_batch_size:
145
- desc: null
146
- value: 32
147
- learning_rate:
148
- desc: null
149
- value: 2.0e-05
150
- weight_decay:
151
- desc: null
152
- value: 0.01
153
- warmup_steps:
154
- desc: null
155
- value: 500
156
- dataset_name:
157
- desc: null
158
- value: libero_spatial_no_noops
159
- data_root_dir:
160
- desc: null
161
- value: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
162
- use_wrist_image:
163
- desc: null
164
- value: true
165
- use_proprio:
166
- desc: null
167
- value: true
168
- sequence_length:
169
- desc: null
170
- value: 384
171
- num_workers:
172
- desc: null
173
- value: 0
174
- num_diffusion_steps:
175
- desc: null
176
- value: 1000
177
- num_diffusion_inference_steps:
178
- desc: null
179
- value: 30
180
- lang_cond_dim:
181
- desc: null
182
- value: 1152
183
- img_cond_dim:
184
- desc: null
185
- value: 1152
186
- num_patches:
187
- desc: null
188
- value: 729
189
- dit_hidden_dim:
190
- desc: null
191
- value: 2048
192
- dit_depth:
193
- desc: null
194
- value: 28
195
- dit_num_heads:
196
- desc: null
197
- value: 16
198
- save_interval:
199
- desc: null
200
- value: 1000
201
- eval_interval:
202
- desc: null
203
- value: 500
204
- log_interval:
205
- desc: null
206
- value: 10
207
- save_num_checkpoints_to_keep:
208
- desc: null
209
- value: 3
210
- save_overwrite:
211
- desc: null
212
- value: true
213
- precision:
214
- desc: null
215
- value: amp_bf16
216
- gradient_accumulation_steps:
217
- desc: null
218
- value: 1
219
- max_grad_norm:
220
- desc: null
221
- value: 1.0
222
- wandb_project:
223
- desc: null
224
- value: a1-dit-action-20.47
225
- wandb_entity:
226
- desc: null
227
- value: demo0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_161945-m8wsmtst/files/output.log DELETED
@@ -1,94 +0,0 @@
1
- Traceback (most recent call last):
2
- File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 216, in main
3
- trainer.fit()
4
- File "/home/zhangjian/A1/olmo/train.py", line 2796, in fit
5
- metrics = self.train_step(batch)
6
- File "/home/zhangjian/A1/olmo/train.py", line 2732, in train_step
7
- text_embeds = self.text_model(input_ids=batch["input_ids"],attention_mask=batch.get("attention_mask")).last_hidden_state.detach()
8
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
9
- return self._call_impl(*args, **kwargs)
10
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
11
- return forward_call(*args, **kwargs)
12
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
13
- output = func(self, *args, **kwargs)
14
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 739, in forward
15
- return self.text_model(
16
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
17
- return self._call_impl(*args, **kwargs)
18
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
19
- return forward_call(*args, **kwargs)
20
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
21
- output = func(self, *args, **kwargs)
22
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 662, in forward
23
- hidden_states = self.embeddings(input_ids=input_ids, position_ids=position_ids)
24
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
25
- return self._call_impl(*args, **kwargs)
26
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
27
- return forward_call(*args, **kwargs)
28
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 308, in forward
29
- raise ValueError(
30
- ValueError: Sequence length must be less than max_position_embeddings (got `sequence length`: 384 and max_position_embeddings: 64
31
- Traceback (most recent call last):
32
- File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 236, in <module>
33
- main()
34
- File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 216, in main
35
- trainer.fit()
36
- File "/home/zhangjian/A1/olmo/train.py", line 2796, in fit
37
- metrics = self.train_step(batch)
38
- File "/home/zhangjian/A1/olmo/train.py", line 2732, in train_step
39
- text_embeds = self.text_model(input_ids=batch["input_ids"],attention_mask=batch.get("attention_mask")).last_hidden_state.detach()
40
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
41
- return self._call_impl(*args, **kwargs)
42
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
43
- return forward_call(*args, **kwargs)
44
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
45
- output = func(self, *args, **kwargs)
46
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 739, in forward
47
- return self.text_model(
48
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
49
- return self._call_impl(*args, **kwargs)
50
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
51
- return forward_call(*args, **kwargs)
52
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
53
- output = func(self, *args, **kwargs)
54
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 662, in forward
55
- hidden_states = self.embeddings(input_ids=input_ids, position_ids=position_ids)
56
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
57
- return self._call_impl(*args, **kwargs)
58
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
59
- return forward_call(*args, **kwargs)
60
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 308, in forward
61
- raise ValueError(
62
- ValueError: Sequence length must be less than max_position_embeddings (got `sequence length`: 384 and max_position_embeddings: 64
63
- [rank0]: Traceback (most recent call last):
64
- [rank0]: File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 236, in <module>
65
- [rank0]: main()
66
- [rank0]: File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 216, in main
67
- [rank0]: trainer.fit()
68
- [rank0]: File "/home/zhangjian/A1/olmo/train.py", line 2796, in fit
69
- [rank0]: metrics = self.train_step(batch)
70
- [rank0]: File "/home/zhangjian/A1/olmo/train.py", line 2732, in train_step
71
- [rank0]: text_embeds = self.text_model(input_ids=batch["input_ids"],attention_mask=batch.get("attention_mask")).last_hidden_state.detach()
72
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
73
- [rank0]: return self._call_impl(*args, **kwargs)
74
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
75
- [rank0]: return forward_call(*args, **kwargs)
76
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
77
- [rank0]: output = func(self, *args, **kwargs)
78
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 739, in forward
79
- [rank0]: return self.text_model(
80
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
81
- [rank0]: return self._call_impl(*args, **kwargs)
82
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
83
- [rank0]: return forward_call(*args, **kwargs)
84
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
85
- [rank0]: output = func(self, *args, **kwargs)
86
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 662, in forward
87
- [rank0]: hidden_states = self.embeddings(input_ids=input_ids, position_ids=position_ids)
88
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
89
- [rank0]: return self._call_impl(*args, **kwargs)
90
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
91
- [rank0]: return forward_call(*args, **kwargs)
92
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 308, in forward
93
- [rank0]: raise ValueError(
94
- [rank0]: ValueError: Sequence length must be less than max_position_embeddings (got `sequence length`: 384 and max_position_embeddings: 64
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_161945-m8wsmtst/files/requirements.txt DELETED
@@ -1,262 +0,0 @@
1
- ai2-molmo==0.0.0
2
- yarl==1.20.1
3
- astunparse==1.6.3
4
- nvidia-cudnn-cu12==9.5.1.17
5
- etils==1.13.0
6
- tensorflow-io-gcs-filesystem==0.37.1
7
- Brotli==1.1.0
8
- gcsfs==2023.9.2
9
- multiprocess==0.70.16
10
- packaging==25.0
11
- idna==3.10
12
- absl-py==2.3.1
13
- id==1.5.0
14
- einops==0.8.1
15
- rich==13.9.4
16
- editdistance==0.8.1
17
- trouting==0.3.3
18
- mypy==1.3.0
19
- distro==1.9.0
20
- cycler==0.12.1
21
- s3transfer==0.13.0
22
- pyarrow==20.0.0
23
- sentry-sdk==2.33.0
24
- toml==0.10.2
25
- GitPython==3.1.44
26
- click==8.2.1
27
- ai2-molmo==0.0.0
28
- tensorflow-datasets==4.9.9
29
- tqdm==4.67.1
30
- safetensors==0.5.3
31
- google-auth==2.40.3
32
- iniconfig==2.1.0
33
- smmap==5.0.2
34
- nvidia-cublas-cu12==12.6.4.1
35
- wheel==0.45.1
36
- pluggy==1.6.0
37
- filelock==3.18.0
38
- google-auth-oauthlib==1.2.2
39
- httpx==0.28.1
40
- pyasn1==0.6.1
41
- typing-inspection==0.4.1
42
- pydub==0.25.1
43
- nvidia-cusparselt-cu12==0.6.3
44
- decorator==5.2.1
45
- frozenlist==1.7.0
46
- backports.tarfile==1.2.0
47
- setuptools==78.1.1
48
- keras==2.15.0
49
- MarkupSafe==3.0.2
50
- libclang==18.1.1
51
- necessary==0.4.3
52
- cached_path==1.7.3
53
- Jinja2==3.1.6
54
- beaker-py==2.4.6
55
- requests-toolbelt==1.0.0
56
- contourpy==1.3.2
57
- python-multipart==0.0.20
58
- nvidia-cusolver-cu12==11.7.1.2
59
- sentencepiece==0.2.0
60
- cffi==1.17.1
61
- gast==0.6.0
62
- nvidia-curand-cu12==10.3.7.77
63
- six==1.17.0
64
- boto3==1.39.5
65
- annotated-types==0.7.0
66
- termcolor==3.1.0
67
- pyparsing==3.2.3
68
- pydantic_core==2.33.2
69
- rfc3986==2.0.0
70
- pydantic==2.11.7
71
- jiter==0.10.0
72
- jaraco.context==6.0.1
73
- importlib_resources==6.5.2
74
- typeguard==2.13.3
75
- nltk==3.9.1
76
- opt_einsum==3.4.0
77
- grpcio==1.73.1
78
- pathspec==0.12.1
79
- triton==3.3.1
80
- gradio==5.37.0
81
- nvidia-nccl-cu12==2.26.2
82
- smart_open==7.3.0.post1
83
- scikit-learn==1.7.0
84
- pytest-sphinx==0.6.3
85
- google-cloud-core==2.4.3
86
- rsa==4.9.1
87
- readme_renderer==44.0
88
- httpcore==1.0.9
89
- threadpoolctl==3.6.0
90
- fsspec==2023.9.2
91
- keyring==25.6.0
92
- aiohttp==3.12.14
93
- attrs==25.3.0
94
- mypy_extensions==1.1.0
95
- antlr4-python3-runtime==4.9.3
96
- orjson==3.11.0
97
- cachetools==5.5.2
98
- requests==2.32.4
99
- smashed==0.21.5
100
- nvidia-cuda-cupti-cu12==12.6.80
101
- aiosignal==1.4.0
102
- torch==2.7.1
103
- xxhash==3.5.0
104
- OpenEXR==3.3.4
105
- cached-property==2.0.1
106
- wcwidth==0.2.13
107
- uvicorn==0.35.0
108
- numpy==1.26.4
109
- flatbuffers==25.2.10
110
- torchmetrics==1.7.4
111
- ftfy==6.3.1
112
- dill==0.3.8
113
- multidict==6.6.3
114
- shellingham==1.5.4
115
- promise==2.3
116
- anyio==4.9.0
117
- regex==2024.11.6
118
- tensorflow-graphics==2021.12.3
119
- pycparser==2.22
120
- nvidia-cuda-runtime-cu12==12.6.77
121
- matplotlib==3.10.3
122
- google-cloud-storage==2.19.0
123
- botocore==1.39.5
124
- click-option-group==0.5.7
125
- pytz==2025.2
126
- fonttools==4.58.5
127
- pyproject_hooks==1.2.0
128
- google-crc32c==1.7.1
129
- Markdown==3.8.2
130
- requests-oauthlib==2.0.0
131
- dlimp==0.0.1
132
- nvidia-cuda-nvrtc-cu12==12.6.77
133
- tomlkit==0.13.3
134
- safehttpx==0.1.6
135
- nvidia-cufft-cu12==11.3.0.4
136
- jmespath==1.0.1
137
- protobuf==4.21.12
138
- nvidia-nvtx-cu12==12.6.77
139
- tensorflow-addons==0.23.0
140
- jaraco.classes==3.4.0
141
- aiofiles==24.1.0
142
- exceptiongroup==1.3.0
143
- libcst==1.8.2
144
- immutabledict==4.2.1
145
- oauthlib==3.3.1
146
- timm==1.0.16
147
- lightning-utilities==0.14.3
148
- jeepney==0.9.0
149
- certifi==2025.7.14
150
- docutils==0.21.2
151
- markdown-it-py==3.0.0
152
- proto-plus==1.26.1
153
- wrapt==1.14.1
154
- mdurl==0.1.2
155
- more-itertools==10.7.0
156
- platformdirs==4.3.8
157
- kiwisolver==1.4.8
158
- tensorboard-data-server==0.7.2
159
- propcache==0.3.2
160
- zipp==3.23.0
161
- Werkzeug==3.1.3
162
- wandb==0.21.0
163
- Levenshtein==0.27.1
164
- isort==5.12.0
165
- simple-parsing==0.1.7
166
- face==24.0.0
167
- tzdata==2025.2
168
- h5py==3.14.0
169
- psutil==7.0.0
170
- mpmath==1.3.0
171
- dm-tree==0.1.9
172
- tensorflow-estimator==2.15.0
173
- pip==25.1
174
- joblib==1.5.1
175
- pyasn1_modules==0.4.2
176
- RapidFuzz==3.13.0
177
- cryptography==45.0.5
178
- typing_extensions==4.14.1
179
- urllib3==2.5.0
180
- sniffio==1.3.1
181
- omegaconf==2.3.0
182
- h11==0.16.0
183
- nvidia-cusparse-cu12==12.5.4.2
184
- click-help-colors==0.9.4
185
- einops-exts==0.0.4
186
- scipy==1.15.3
187
- nvidia-cufile-cu12==1.11.1.6
188
- huggingface-hub==0.33.4
189
- PyYAML==6.0.2
190
- pandas==2.3.1
191
- python-dateutil==2.9.0.post0
192
- petname==2.6
193
- tensorboard==2.15.2
194
- python-Levenshtein==0.27.1
195
- graphviz==0.21
196
- datasets==4.0.0
197
- gradio_client==1.10.4
198
- networkx==3.4.2
199
- nh3==0.2.22
200
- jaraco.functools==4.2.1
201
- ml-dtypes==0.2.0
202
- gitdb==4.0.12
203
- google-pasta==0.2.0
204
- openai==1.96.1
205
- aiohappyeyeballs==2.6.1
206
- docstring_parser==0.16
207
- build==1.2.2.post1
208
- tokenizers==0.21.2
209
- black==23.12.1
210
- fiddle==0.3.0
211
- requirements-parser==0.13.0
212
- ruff==0.12.3
213
- trimesh==4.7.0
214
- Pygments==2.19.2
215
- google-resumable-media==2.7.2
216
- async-timeout==5.0.1
217
- hf-xet==1.1.5
218
- groovy==0.1.2
219
- accelerate==1.8.1
220
- diffusers==0.33.1
221
- SecretStorage==3.3.3
222
- ffmpy==0.6.0
223
- websockets==15.0.1
224
- fastapi==0.116.1
225
- importlib_metadata==8.7.0
226
- pillow==11.3.0
227
- nvidia-nvjitlink-cu12==12.6.85
228
- beaker-gantry==2.8.3
229
- glom==24.11.0
230
- transformers==4.53.2
231
- pytest==8.4.1
232
- tensorflow==2.15.0
233
- semantic-version==2.10.0
234
- charset-normalizer==3.4.2
235
- tensorflow-metadata==1.17.2
236
- googleapis-common-protos==1.70.0
237
- boltons==25.0.0
238
- twine==6.1.0
239
- tomli==2.2.1
240
- google-api-core==2.25.1
241
- typer==0.16.0
242
- sympy==1.14.0
243
- starlette==0.47.1
244
- msgspec==0.19.0
245
- array_record==0.7.2
246
- torchvision==0.22.1
247
- typing_extensions==4.12.2
248
- wheel==0.45.1
249
- backports.tarfile==1.2.0
250
- inflect==7.3.1
251
- zipp==3.19.2
252
- jaraco.collections==5.1.0
253
- jaraco.text==3.12.1
254
- jaraco.context==5.3.0
255
- jaraco.functools==4.0.1
256
- tomli==2.0.1
257
- platformdirs==4.2.2
258
- packaging==24.2
259
- typeguard==4.3.0
260
- importlib_metadata==8.0.0
261
- more-itertools==10.3.0
262
- autocommand==2.2.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_161945-m8wsmtst/files/wandb-metadata.json DELETED
@@ -1 +0,0 @@
1
- {"os": "Linux-5.15.0-142-generic-x86_64-with-glibc2.35", "python": "CPython 3.10.16", "started_at": "2025-07-18T08:19:45.826177Z", "args": ["--save_folder=/mnt/data/zhangjian/a1/libero_spatial_dit_action", "--save_overwrite"], "program": "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", "code_path": "launch_scripts/train_vla_dit_action.py", "code_path_local": "launch_scripts/train_vla_dit_action.py", "git": {"remote_url": "https://github.com/Spatialtemporal-AI/A1.git", "commit": "2e05e206652258f5fbb178ec13c792c2a91c1856"}, "root": "/home/zhangjian/A1", "host": "iv-ydwxzrkf0gvr6okuck21", "executable": "/mnt/data/zhangjian/miniconda3/envs/a1/bin/python3.10", "cpu_count": 56, "cpu_count_logical": 112, "gpu_type": "NVIDIA A100-SXM4-80GB", "gpu_count": 8, "disk": {"/": {"total": "507024936960", "used": "133182132224"}}, "memory": {"total": "2071488372736"}, "gpu_nvidia": [{"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-b01b938f-1b95-8587-4b93-cfa68d84c935"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-49b283f0-f1e6-992d-4ed8-99855a5e6529"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-a340dca6-1db9-f578-76f2-cf36f74ffabd"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-c1bddabf-aa88-9c8f-eec2-6dc3e117f985"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-4096c1e7-0437-6727-096f-d67141c140b8"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-eeb896c0-61d6-8380-778b-d02101078a17"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-d5c1ed79-76e3-22a6-8908-df289b090c03"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-6d90b060-f6f7-599b-f939-4ba124ff11b7"}], "cuda_version": "12.8", "writer_id": "gkv6pcimbk2w6ig5eqnc01n6qgq9ed3l"}
 
 
wandb/offline-run-20250718_161945-m8wsmtst/files/wandb-summary.json DELETED
@@ -1 +0,0 @@
1
- {"_runtime": 6}
 
 
wandb/offline-run-20250718_161945-m8wsmtst/logs/debug-core.log DELETED
@@ -1,14 +0,0 @@
1
- {"time":"2025-07-18T16:19:45.856929542+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmph2yqu36w/port-2874027.txt","pid":2874027,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
- {"time":"2025-07-18T16:19:45.857509675+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":2874027}
3
- {"time":"2025-07-18T16:19:45.8575527+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2874027-2876426-2611772877/socket","Net":"unix"}}
4
- {"time":"2025-07-18T16:19:46.034393648+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
- {"time":"2025-07-18T16:19:46.038087649+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"m8wsmtst","id":"1(@)"}
6
- {"time":"2025-07-18T16:19:46.157222198+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"m8wsmtst","id":"1(@)"}
7
- {"time":"2025-07-18T16:19:52.167429191+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
- {"time":"2025-07-18T16:19:52.167510001+08:00","level":"INFO","msg":"server is shutting down"}
9
- {"time":"2025-07-18T16:19:52.16750131+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
- {"time":"2025-07-18T16:19:52.167581797+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
11
- {"time":"2025-07-18T16:19:52.167604834+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2874027-2876426-2611772877/socket","Net":"unix"}}
12
- {"time":"2025-07-18T16:19:52.169166335+08:00","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
13
- {"time":"2025-07-18T16:19:52.169190878+08:00","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
14
- {"time":"2025-07-18T16:19:52.169201032+08:00","level":"INFO","msg":"server is closed"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_161945-m8wsmtst/logs/debug-internal.log DELETED
@@ -1,13 +0,0 @@
1
- {"time":"2025-07-18T16:19:46.042031385+08:00","level":"INFO","msg":"stream: starting","core version":"0.21.0"}
2
- {"time":"2025-07-18T16:19:46.157051193+08:00","level":"WARN","msg":"GraphQL client is nil, skipping feature loading"}
3
- {"time":"2025-07-18T16:19:46.157197135+08:00","level":"INFO","msg":"stream: created new stream","id":"m8wsmtst"}
4
- {"time":"2025-07-18T16:19:46.157216504+08:00","level":"INFO","msg":"stream: started","id":"m8wsmtst"}
5
- {"time":"2025-07-18T16:19:46.157229719+08:00","level":"INFO","msg":"writer: Do: started","stream_id":"m8wsmtst"}
6
- {"time":"2025-07-18T16:19:46.157247709+08:00","level":"INFO","msg":"handler: started","stream_id":"m8wsmtst"}
7
- {"time":"2025-07-18T16:19:46.15725118+08:00","level":"INFO","msg":"sender: started","stream_id":"m8wsmtst"}
8
- {"time":"2025-07-18T16:19:46.157739142+08:00","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
9
- {"time":"2025-07-18T16:19:52.167599755+08:00","level":"INFO","msg":"stream: closing","id":"m8wsmtst"}
10
- {"time":"2025-07-18T16:19:52.167794108+08:00","level":"INFO","msg":"handler: closed","stream_id":"m8wsmtst"}
11
- {"time":"2025-07-18T16:19:52.167820176+08:00","level":"INFO","msg":"writer: Close: closed","stream_id":"m8wsmtst"}
12
- {"time":"2025-07-18T16:19:52.167839497+08:00","level":"INFO","msg":"sender: closed","stream_id":"m8wsmtst"}
13
- {"time":"2025-07-18T16:19:52.167887348+08:00","level":"INFO","msg":"stream: closed","id":"m8wsmtst"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_161945-m8wsmtst/logs/debug.log DELETED
File without changes
wandb/offline-run-20250718_161945-m8wsmtst/run-m8wsmtst.wandb DELETED
Binary file (14.5 kB)
 
wandb/offline-run-20250718_161945-m8wsmtst/run-m8wsmtst.wandb.synced DELETED
File without changes
wandb/offline-run-20250718_162533-enh8w5nh/files/output.log DELETED
File without changes
wandb/offline-run-20250718_162533-enh8w5nh/files/requirements.txt DELETED
@@ -1,262 +0,0 @@
1
- ai2-molmo==0.0.0
2
- yarl==1.20.1
3
- astunparse==1.6.3
4
- nvidia-cudnn-cu12==9.5.1.17
5
- etils==1.13.0
6
- tensorflow-io-gcs-filesystem==0.37.1
7
- Brotli==1.1.0
8
- gcsfs==2023.9.2
9
- multiprocess==0.70.16
10
- packaging==25.0
11
- idna==3.10
12
- absl-py==2.3.1
13
- id==1.5.0
14
- einops==0.8.1
15
- rich==13.9.4
16
- editdistance==0.8.1
17
- trouting==0.3.3
18
- mypy==1.3.0
19
- distro==1.9.0
20
- cycler==0.12.1
21
- s3transfer==0.13.0
22
- pyarrow==20.0.0
23
- sentry-sdk==2.33.0
24
- toml==0.10.2
25
- GitPython==3.1.44
26
- click==8.2.1
27
- ai2-molmo==0.0.0
28
- tensorflow-datasets==4.9.9
29
- tqdm==4.67.1
30
- safetensors==0.5.3
31
- google-auth==2.40.3
32
- iniconfig==2.1.0
33
- smmap==5.0.2
34
- nvidia-cublas-cu12==12.6.4.1
35
- wheel==0.45.1
36
- pluggy==1.6.0
37
- filelock==3.18.0
38
- google-auth-oauthlib==1.2.2
39
- httpx==0.28.1
40
- pyasn1==0.6.1
41
- typing-inspection==0.4.1
42
- pydub==0.25.1
43
- nvidia-cusparselt-cu12==0.6.3
44
- decorator==5.2.1
45
- frozenlist==1.7.0
46
- backports.tarfile==1.2.0
47
- setuptools==78.1.1
48
- keras==2.15.0
49
- MarkupSafe==3.0.2
50
- libclang==18.1.1
51
- necessary==0.4.3
52
- cached_path==1.7.3
53
- Jinja2==3.1.6
54
- beaker-py==2.4.6
55
- requests-toolbelt==1.0.0
56
- contourpy==1.3.2
57
- python-multipart==0.0.20
58
- nvidia-cusolver-cu12==11.7.1.2
59
- sentencepiece==0.2.0
60
- cffi==1.17.1
61
- gast==0.6.0
62
- nvidia-curand-cu12==10.3.7.77
63
- six==1.17.0
64
- boto3==1.39.5
65
- annotated-types==0.7.0
66
- termcolor==3.1.0
67
- pyparsing==3.2.3
68
- pydantic_core==2.33.2
69
- rfc3986==2.0.0
70
- pydantic==2.11.7
71
- jiter==0.10.0
72
- jaraco.context==6.0.1
73
- importlib_resources==6.5.2
74
- typeguard==2.13.3
75
- nltk==3.9.1
76
- opt_einsum==3.4.0
77
- grpcio==1.73.1
78
- pathspec==0.12.1
79
- triton==3.3.1
80
- gradio==5.37.0
81
- nvidia-nccl-cu12==2.26.2
82
- smart_open==7.3.0.post1
83
- scikit-learn==1.7.0
84
- pytest-sphinx==0.6.3
85
- google-cloud-core==2.4.3
86
- rsa==4.9.1
87
- readme_renderer==44.0
88
- httpcore==1.0.9
89
- threadpoolctl==3.6.0
90
- fsspec==2023.9.2
91
- keyring==25.6.0
92
- aiohttp==3.12.14
93
- attrs==25.3.0
94
- mypy_extensions==1.1.0
95
- antlr4-python3-runtime==4.9.3
96
- orjson==3.11.0
97
- cachetools==5.5.2
98
- requests==2.32.4
99
- smashed==0.21.5
100
- nvidia-cuda-cupti-cu12==12.6.80
101
- aiosignal==1.4.0
102
- torch==2.7.1
103
- xxhash==3.5.0
104
- OpenEXR==3.3.4
105
- cached-property==2.0.1
106
- wcwidth==0.2.13
107
- uvicorn==0.35.0
108
- numpy==1.26.4
109
- flatbuffers==25.2.10
110
- torchmetrics==1.7.4
111
- ftfy==6.3.1
112
- dill==0.3.8
113
- multidict==6.6.3
114
- shellingham==1.5.4
115
- promise==2.3
116
- anyio==4.9.0
117
- regex==2024.11.6
118
- tensorflow-graphics==2021.12.3
119
- pycparser==2.22
120
- nvidia-cuda-runtime-cu12==12.6.77
121
- matplotlib==3.10.3
122
- google-cloud-storage==2.19.0
123
- botocore==1.39.5
124
- click-option-group==0.5.7
125
- pytz==2025.2
126
- fonttools==4.58.5
127
- pyproject_hooks==1.2.0
128
- google-crc32c==1.7.1
129
- Markdown==3.8.2
130
- requests-oauthlib==2.0.0
131
- dlimp==0.0.1
132
- nvidia-cuda-nvrtc-cu12==12.6.77
133
- tomlkit==0.13.3
134
- safehttpx==0.1.6
135
- nvidia-cufft-cu12==11.3.0.4
136
- jmespath==1.0.1
137
- protobuf==4.21.12
138
- nvidia-nvtx-cu12==12.6.77
139
- tensorflow-addons==0.23.0
140
- jaraco.classes==3.4.0
141
- aiofiles==24.1.0
142
- exceptiongroup==1.3.0
143
- libcst==1.8.2
144
- immutabledict==4.2.1
145
- oauthlib==3.3.1
146
- timm==1.0.16
147
- lightning-utilities==0.14.3
148
- jeepney==0.9.0
149
- certifi==2025.7.14
150
- docutils==0.21.2
151
- markdown-it-py==3.0.0
152
- proto-plus==1.26.1
153
- wrapt==1.14.1
154
- mdurl==0.1.2
155
- more-itertools==10.7.0
156
- platformdirs==4.3.8
157
- kiwisolver==1.4.8
158
- tensorboard-data-server==0.7.2
159
- propcache==0.3.2
160
- zipp==3.23.0
161
- Werkzeug==3.1.3
162
- wandb==0.21.0
163
- Levenshtein==0.27.1
164
- isort==5.12.0
165
- simple-parsing==0.1.7
166
- face==24.0.0
167
- tzdata==2025.2
168
- h5py==3.14.0
169
- psutil==7.0.0
170
- mpmath==1.3.0
171
- dm-tree==0.1.9
172
- tensorflow-estimator==2.15.0
173
- pip==25.1
174
- joblib==1.5.1
175
- pyasn1_modules==0.4.2
176
- RapidFuzz==3.13.0
177
- cryptography==45.0.5
178
- typing_extensions==4.14.1
179
- urllib3==2.5.0
180
- sniffio==1.3.1
181
- omegaconf==2.3.0
182
- h11==0.16.0
183
- nvidia-cusparse-cu12==12.5.4.2
184
- click-help-colors==0.9.4
185
- einops-exts==0.0.4
186
- scipy==1.15.3
187
- nvidia-cufile-cu12==1.11.1.6
188
- huggingface-hub==0.33.4
189
- PyYAML==6.0.2
190
- pandas==2.3.1
191
- python-dateutil==2.9.0.post0
192
- petname==2.6
193
- tensorboard==2.15.2
194
- python-Levenshtein==0.27.1
195
- graphviz==0.21
196
- datasets==4.0.0
197
- gradio_client==1.10.4
198
- networkx==3.4.2
199
- nh3==0.2.22
200
- jaraco.functools==4.2.1
201
- ml-dtypes==0.2.0
202
- gitdb==4.0.12
203
- google-pasta==0.2.0
204
- openai==1.96.1
205
- aiohappyeyeballs==2.6.1
206
- docstring_parser==0.16
207
- build==1.2.2.post1
208
- tokenizers==0.21.2
209
- black==23.12.1
210
- fiddle==0.3.0
211
- requirements-parser==0.13.0
212
- ruff==0.12.3
213
- trimesh==4.7.0
214
- Pygments==2.19.2
215
- google-resumable-media==2.7.2
216
- async-timeout==5.0.1
217
- hf-xet==1.1.5
218
- groovy==0.1.2
219
- accelerate==1.8.1
220
- diffusers==0.33.1
221
- SecretStorage==3.3.3
222
- ffmpy==0.6.0
223
- websockets==15.0.1
224
- fastapi==0.116.1
225
- importlib_metadata==8.7.0
226
- pillow==11.3.0
227
- nvidia-nvjitlink-cu12==12.6.85
228
- beaker-gantry==2.8.3
229
- glom==24.11.0
230
- transformers==4.53.2
231
- pytest==8.4.1
232
- tensorflow==2.15.0
233
- semantic-version==2.10.0
234
- charset-normalizer==3.4.2
235
- tensorflow-metadata==1.17.2
236
- googleapis-common-protos==1.70.0
237
- boltons==25.0.0
238
- twine==6.1.0
239
- tomli==2.2.1
240
- google-api-core==2.25.1
241
- typer==0.16.0
242
- sympy==1.14.0
243
- starlette==0.47.1
244
- msgspec==0.19.0
245
- array_record==0.7.2
246
- torchvision==0.22.1
247
- typing_extensions==4.12.2
248
- wheel==0.45.1
249
- backports.tarfile==1.2.0
250
- inflect==7.3.1
251
- zipp==3.19.2
252
- jaraco.collections==5.1.0
253
- jaraco.text==3.12.1
254
- jaraco.context==5.3.0
255
- jaraco.functools==4.0.1
256
- tomli==2.0.1
257
- platformdirs==4.2.2
258
- packaging==24.2
259
- typeguard==4.3.0
260
- importlib_metadata==8.0.0
261
- more-itertools==10.3.0
262
- autocommand==2.2.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_162533-enh8w5nh/logs/debug-core.log DELETED
@@ -1,7 +0,0 @@
1
- {"time":"2025-07-18T16:25:33.048887646+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpo5iypyp2/port-2884717.txt","pid":2884717,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
- {"time":"2025-07-18T16:25:33.049416652+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":2884717}
3
- {"time":"2025-07-18T16:25:33.049407439+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2884717-2886714-2553117481/socket","Net":"unix"}}
4
- {"time":"2025-07-18T16:25:33.227775424+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
- {"time":"2025-07-18T16:25:33.231715039+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"enh8w5nh","id":"1(@)"}
6
- {"time":"2025-07-18T16:25:33.349089165+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"enh8w5nh","id":"1(@)"}
7
- {"time":"2025-07-18T16:25:38.161645631+08:00","level":"INFO","msg":"server: parent process exited, terminating service process"}
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_162533-enh8w5nh/logs/debug-internal.log DELETED
@@ -1,8 +0,0 @@
1
- {"time":"2025-07-18T16:25:33.23556091+08:00","level":"INFO","msg":"stream: starting","core version":"0.21.0"}
2
- {"time":"2025-07-18T16:25:33.348898335+08:00","level":"WARN","msg":"GraphQL client is nil, skipping feature loading"}
3
- {"time":"2025-07-18T16:25:33.349063018+08:00","level":"INFO","msg":"stream: created new stream","id":"enh8w5nh"}
4
- {"time":"2025-07-18T16:25:33.349083407+08:00","level":"INFO","msg":"stream: started","id":"enh8w5nh"}
5
- {"time":"2025-07-18T16:25:33.349099668+08:00","level":"INFO","msg":"writer: Do: started","stream_id":"enh8w5nh"}
6
- {"time":"2025-07-18T16:25:33.349118419+08:00","level":"INFO","msg":"sender: started","stream_id":"enh8w5nh"}
7
- {"time":"2025-07-18T16:25:33.349126683+08:00","level":"INFO","msg":"handler: started","stream_id":"enh8w5nh"}
8
- {"time":"2025-07-18T16:25:33.349658731+08:00","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_162533-enh8w5nh/logs/debug.log DELETED
File without changes
wandb/offline-run-20250718_162533-enh8w5nh/run-enh8w5nh.wandb DELETED
File without changes
wandb/offline-run-20250718_162819-6btqdhbk/files/output.log DELETED
File without changes
wandb/offline-run-20250718_162819-6btqdhbk/files/requirements.txt DELETED
@@ -1,262 +0,0 @@
1
- ai2-molmo==0.0.0
2
- yarl==1.20.1
3
- astunparse==1.6.3
4
- nvidia-cudnn-cu12==9.5.1.17
5
- etils==1.13.0
6
- tensorflow-io-gcs-filesystem==0.37.1
7
- Brotli==1.1.0
8
- gcsfs==2023.9.2
9
- multiprocess==0.70.16
10
- packaging==25.0
11
- idna==3.10
12
- absl-py==2.3.1
13
- id==1.5.0
14
- einops==0.8.1
15
- rich==13.9.4
16
- editdistance==0.8.1
17
- trouting==0.3.3
18
- mypy==1.3.0
19
- distro==1.9.0
20
- cycler==0.12.1
21
- s3transfer==0.13.0
22
- pyarrow==20.0.0
23
- sentry-sdk==2.33.0
24
- toml==0.10.2
25
- GitPython==3.1.44
26
- click==8.2.1
27
- ai2-molmo==0.0.0
28
- tensorflow-datasets==4.9.9
29
- tqdm==4.67.1
30
- safetensors==0.5.3
31
- google-auth==2.40.3
32
- iniconfig==2.1.0
33
- smmap==5.0.2
34
- nvidia-cublas-cu12==12.6.4.1
35
- wheel==0.45.1
36
- pluggy==1.6.0
37
- filelock==3.18.0
38
- google-auth-oauthlib==1.2.2
39
- httpx==0.28.1
40
- pyasn1==0.6.1
41
- typing-inspection==0.4.1
42
- pydub==0.25.1
43
- nvidia-cusparselt-cu12==0.6.3
44
- decorator==5.2.1
45
- frozenlist==1.7.0
46
- backports.tarfile==1.2.0
47
- setuptools==78.1.1
48
- keras==2.15.0
49
- MarkupSafe==3.0.2
50
- libclang==18.1.1
51
- necessary==0.4.3
52
- cached_path==1.7.3
53
- Jinja2==3.1.6
54
- beaker-py==2.4.6
55
- requests-toolbelt==1.0.0
56
- contourpy==1.3.2
57
- python-multipart==0.0.20
58
- nvidia-cusolver-cu12==11.7.1.2
59
- sentencepiece==0.2.0
60
- cffi==1.17.1
61
- gast==0.6.0
62
- nvidia-curand-cu12==10.3.7.77
63
- six==1.17.0
64
- boto3==1.39.5
65
- annotated-types==0.7.0
66
- termcolor==3.1.0
67
- pyparsing==3.2.3
68
- pydantic_core==2.33.2
69
- rfc3986==2.0.0
70
- pydantic==2.11.7
71
- jiter==0.10.0
72
- jaraco.context==6.0.1
73
- importlib_resources==6.5.2
74
- typeguard==2.13.3
75
- nltk==3.9.1
76
- opt_einsum==3.4.0
77
- grpcio==1.73.1
78
- pathspec==0.12.1
79
- triton==3.3.1
80
- gradio==5.37.0
81
- nvidia-nccl-cu12==2.26.2
82
- smart_open==7.3.0.post1
83
- scikit-learn==1.7.0
84
- pytest-sphinx==0.6.3
85
- google-cloud-core==2.4.3
86
- rsa==4.9.1
87
- readme_renderer==44.0
88
- httpcore==1.0.9
89
- threadpoolctl==3.6.0
90
- fsspec==2023.9.2
91
- keyring==25.6.0
92
- aiohttp==3.12.14
93
- attrs==25.3.0
94
- mypy_extensions==1.1.0
95
- antlr4-python3-runtime==4.9.3
96
- orjson==3.11.0
97
- cachetools==5.5.2
98
- requests==2.32.4
99
- smashed==0.21.5
100
- nvidia-cuda-cupti-cu12==12.6.80
101
- aiosignal==1.4.0
102
- torch==2.7.1
103
- xxhash==3.5.0
104
- OpenEXR==3.3.4
105
- cached-property==2.0.1
106
- wcwidth==0.2.13
107
- uvicorn==0.35.0
108
- numpy==1.26.4
109
- flatbuffers==25.2.10
110
- torchmetrics==1.7.4
111
- ftfy==6.3.1
112
- dill==0.3.8
113
- multidict==6.6.3
114
- shellingham==1.5.4
115
- promise==2.3
116
- anyio==4.9.0
117
- regex==2024.11.6
118
- tensorflow-graphics==2021.12.3
119
- pycparser==2.22
120
- nvidia-cuda-runtime-cu12==12.6.77
121
- matplotlib==3.10.3
122
- google-cloud-storage==2.19.0
123
- botocore==1.39.5
124
- click-option-group==0.5.7
125
- pytz==2025.2
126
- fonttools==4.58.5
127
- pyproject_hooks==1.2.0
128
- google-crc32c==1.7.1
129
- Markdown==3.8.2
130
- requests-oauthlib==2.0.0
131
- dlimp==0.0.1
132
- nvidia-cuda-nvrtc-cu12==12.6.77
133
- tomlkit==0.13.3
134
- safehttpx==0.1.6
135
- nvidia-cufft-cu12==11.3.0.4
136
- jmespath==1.0.1
137
- protobuf==4.21.12
138
- nvidia-nvtx-cu12==12.6.77
139
- tensorflow-addons==0.23.0
140
- jaraco.classes==3.4.0
141
- aiofiles==24.1.0
142
- exceptiongroup==1.3.0
143
- libcst==1.8.2
144
- immutabledict==4.2.1
145
- oauthlib==3.3.1
146
- timm==1.0.16
147
- lightning-utilities==0.14.3
148
- jeepney==0.9.0
149
- certifi==2025.7.14
150
- docutils==0.21.2
151
- markdown-it-py==3.0.0
152
- proto-plus==1.26.1
153
- wrapt==1.14.1
154
- mdurl==0.1.2
155
- more-itertools==10.7.0
156
- platformdirs==4.3.8
157
- kiwisolver==1.4.8
158
- tensorboard-data-server==0.7.2
159
- propcache==0.3.2
160
- zipp==3.23.0
161
- Werkzeug==3.1.3
162
- wandb==0.21.0
163
- Levenshtein==0.27.1
164
- isort==5.12.0
165
- simple-parsing==0.1.7
166
- face==24.0.0
167
- tzdata==2025.2
168
- h5py==3.14.0
169
- psutil==7.0.0
170
- mpmath==1.3.0
171
- dm-tree==0.1.9
172
- tensorflow-estimator==2.15.0
173
- pip==25.1
174
- joblib==1.5.1
175
- pyasn1_modules==0.4.2
176
- RapidFuzz==3.13.0
177
- cryptography==45.0.5
178
- typing_extensions==4.14.1
179
- urllib3==2.5.0
180
- sniffio==1.3.1
181
- omegaconf==2.3.0
182
- h11==0.16.0
183
- nvidia-cusparse-cu12==12.5.4.2
184
- click-help-colors==0.9.4
185
- einops-exts==0.0.4
186
- scipy==1.15.3
187
- nvidia-cufile-cu12==1.11.1.6
188
- huggingface-hub==0.33.4
189
- PyYAML==6.0.2
190
- pandas==2.3.1
191
- python-dateutil==2.9.0.post0
192
- petname==2.6
193
- tensorboard==2.15.2
194
- python-Levenshtein==0.27.1
195
- graphviz==0.21
196
- datasets==4.0.0
197
- gradio_client==1.10.4
198
- networkx==3.4.2
199
- nh3==0.2.22
200
- jaraco.functools==4.2.1
201
- ml-dtypes==0.2.0
202
- gitdb==4.0.12
203
- google-pasta==0.2.0
204
- openai==1.96.1
205
- aiohappyeyeballs==2.6.1
206
- docstring_parser==0.16
207
- build==1.2.2.post1
208
- tokenizers==0.21.2
209
- black==23.12.1
210
- fiddle==0.3.0
211
- requirements-parser==0.13.0
212
- ruff==0.12.3
213
- trimesh==4.7.0
214
- Pygments==2.19.2
215
- google-resumable-media==2.7.2
216
- async-timeout==5.0.1
217
- hf-xet==1.1.5
218
- groovy==0.1.2
219
- accelerate==1.8.1
220
- diffusers==0.33.1
221
- SecretStorage==3.3.3
222
- ffmpy==0.6.0
223
- websockets==15.0.1
224
- fastapi==0.116.1
225
- importlib_metadata==8.7.0
226
- pillow==11.3.0
227
- nvidia-nvjitlink-cu12==12.6.85
228
- beaker-gantry==2.8.3
229
- glom==24.11.0
230
- transformers==4.53.2
231
- pytest==8.4.1
232
- tensorflow==2.15.0
233
- semantic-version==2.10.0
234
- charset-normalizer==3.4.2
235
- tensorflow-metadata==1.17.2
236
- googleapis-common-protos==1.70.0
237
- boltons==25.0.0
238
- twine==6.1.0
239
- tomli==2.2.1
240
- google-api-core==2.25.1
241
- typer==0.16.0
242
- sympy==1.14.0
243
- starlette==0.47.1
244
- msgspec==0.19.0
245
- array_record==0.7.2
246
- torchvision==0.22.1
247
- typing_extensions==4.12.2
248
- wheel==0.45.1
249
- backports.tarfile==1.2.0
250
- inflect==7.3.1
251
- zipp==3.19.2
252
- jaraco.collections==5.1.0
253
- jaraco.text==3.12.1
254
- jaraco.context==5.3.0
255
- jaraco.functools==4.0.1
256
- tomli==2.0.1
257
- platformdirs==4.2.2
258
- packaging==24.2
259
- typeguard==4.3.0
260
- importlib_metadata==8.0.0
261
- more-itertools==10.3.0
262
- autocommand==2.2.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_162819-6btqdhbk/logs/debug-core.log DELETED
@@ -1,7 +0,0 @@
1
- {"time":"2025-07-18T16:28:19.409855671+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp0pgj9n56/port-2890422.txt","pid":2890422,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
- {"time":"2025-07-18T16:28:19.410428972+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":2890422}
3
- {"time":"2025-07-18T16:28:19.410449859+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2890422-2892247-2023005874/socket","Net":"unix"}}
4
- {"time":"2025-07-18T16:28:19.589965556+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
- {"time":"2025-07-18T16:28:19.594940331+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"6btqdhbk","id":"1(@)"}
6
- {"time":"2025-07-18T16:28:19.712915229+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"6btqdhbk","id":"1(@)"}
7
- {"time":"2025-07-18T16:28:26.728818238+08:00","level":"INFO","msg":"server: parent process exited, terminating service process"}
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_162819-6btqdhbk/logs/debug-internal.log DELETED
@@ -1,8 +0,0 @@
1
- {"time":"2025-07-18T16:28:19.598579541+08:00","level":"INFO","msg":"stream: starting","core version":"0.21.0"}
2
- {"time":"2025-07-18T16:28:19.712737263+08:00","level":"WARN","msg":"GraphQL client is nil, skipping feature loading"}
3
- {"time":"2025-07-18T16:28:19.712888407+08:00","level":"INFO","msg":"stream: created new stream","id":"6btqdhbk"}
4
- {"time":"2025-07-18T16:28:19.712910248+08:00","level":"INFO","msg":"stream: started","id":"6btqdhbk"}
5
- {"time":"2025-07-18T16:28:19.712932303+08:00","level":"INFO","msg":"writer: Do: started","stream_id":"6btqdhbk"}
6
- {"time":"2025-07-18T16:28:19.712954867+08:00","level":"INFO","msg":"handler: started","stream_id":"6btqdhbk"}
7
- {"time":"2025-07-18T16:28:19.712947454+08:00","level":"INFO","msg":"sender: started","stream_id":"6btqdhbk"}
8
- {"time":"2025-07-18T16:28:19.71364791+08:00","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_162819-6btqdhbk/logs/debug.log DELETED
File without changes
wandb/offline-run-20250718_162819-6btqdhbk/run-6btqdhbk.wandb DELETED
File without changes
wandb/offline-run-20250718_163819-kujhudzv/files/config.yaml DELETED
@@ -1,227 +0,0 @@
1
- wandb_version: 1
2
-
3
- _wandb:
4
- desc: null
5
- value:
6
- python_version: 3.10.16
7
- cli_version: 0.21.0
8
- framework: huggingface
9
- huggingface_version: 4.53.2
10
- is_jupyter_run: false
11
- is_kaggle_kernel: false
12
- start_time: 1752827899
13
- t:
14
- 1:
15
- - 1
16
- - 2
17
- - 3
18
- - 5
19
- - 11
20
- - 41
21
- - 49
22
- - 51
23
- - 53
24
- - 63
25
- - 71
26
- - 83
27
- - 95
28
- - 105
29
- 2:
30
- - 1
31
- - 2
32
- - 3
33
- - 5
34
- - 11
35
- - 41
36
- - 49
37
- - 51
38
- - 53
39
- - 63
40
- - 71
41
- - 83
42
- - 95
43
- - 105
44
- 3:
45
- - 4
46
- - 13
47
- - 16
48
- - 42
49
- 4: 3.10.16
50
- 5: 0.21.0
51
- 6: 4.53.2
52
- 13: linux-x86_64
53
- e:
54
- oygl393zcukmmdj0i9c4b0424qwzehyz:
55
- os: Linux-5.15.0-142-generic-x86_64-with-glibc2.35
56
- python: CPython 3.10.16
57
- started_at: '2025-07-18T08:38:19.403312Z'
58
- args:
59
- - --save_folder=/mnt/data/zhangjian/a1/libero_spatial_dit_action
60
- - --save_overwrite
61
- program: /home/zhangjian/A1/launch_scripts/train_vla_dit_action.py
62
- code_path: launch_scripts/train_vla_dit_action.py
63
- code_path_local: launch_scripts/train_vla_dit_action.py
64
- git:
65
- remote_url: https://github.com/Spatialtemporal-AI/A1.git
66
- commit: 2e05e206652258f5fbb178ec13c792c2a91c1856
67
- root: /home/zhangjian/A1
68
- host: iv-ydwxzrkf0gvr6okuck21
69
- executable: /mnt/data/zhangjian/miniconda3/envs/a1/bin/python3.10
70
- cpu_count: 56
71
- cpu_count_logical: 112
72
- gpu_type: NVIDIA A100-SXM4-80GB
73
- gpu_count: 8
74
- disk:
75
- /:
76
- total: '507024936960'
77
- used: '133188997120'
78
- memory:
79
- total: '2071488372736'
80
- gpu_nvidia:
81
- - name: NVIDIA A100-SXM4-80GB
82
- memory_total: '85899345920'
83
- cuda_cores: 6912
84
- architecture: Ampere
85
- uuid: GPU-b01b938f-1b95-8587-4b93-cfa68d84c935
86
- - name: NVIDIA A100-SXM4-80GB
87
- memory_total: '85899345920'
88
- cuda_cores: 6912
89
- architecture: Ampere
90
- uuid: GPU-49b283f0-f1e6-992d-4ed8-99855a5e6529
91
- - name: NVIDIA A100-SXM4-80GB
92
- memory_total: '85899345920'
93
- cuda_cores: 6912
94
- architecture: Ampere
95
- uuid: GPU-a340dca6-1db9-f578-76f2-cf36f74ffabd
96
- - name: NVIDIA A100-SXM4-80GB
97
- memory_total: '85899345920'
98
- cuda_cores: 6912
99
- architecture: Ampere
100
- uuid: GPU-c1bddabf-aa88-9c8f-eec2-6dc3e117f985
101
- - name: NVIDIA A100-SXM4-80GB
102
- memory_total: '85899345920'
103
- cuda_cores: 6912
104
- architecture: Ampere
105
- uuid: GPU-4096c1e7-0437-6727-096f-d67141c140b8
106
- - name: NVIDIA A100-SXM4-80GB
107
- memory_total: '85899345920'
108
- cuda_cores: 6912
109
- architecture: Ampere
110
- uuid: GPU-eeb896c0-61d6-8380-778b-d02101078a17
111
- - name: NVIDIA A100-SXM4-80GB
112
- memory_total: '85899345920'
113
- cuda_cores: 6912
114
- architecture: Ampere
115
- uuid: GPU-d5c1ed79-76e3-22a6-8908-df289b090c03
116
- - name: NVIDIA A100-SXM4-80GB
117
- memory_total: '85899345920'
118
- cuda_cores: 6912
119
- architecture: Ampere
120
- uuid: GPU-6d90b060-f6f7-599b-f939-4ba124ff11b7
121
- cuda_version: '12.8'
122
- writer_id: oygl393zcukmmdj0i9c4b0424qwzehyz
123
- text_model_name:
124
- desc: null
125
- value: google/siglip-so400m-patch14-384
126
- vision_model_name:
127
- desc: null
128
- value: google/siglip-so400m-patch14-384
129
- run_name:
130
- desc: null
131
- value: dit_action_train_20250718_163750
132
- save_folder:
133
- desc: null
134
- value: /mnt/data/zhangjian/a1/libero_spatial_dit_action
135
- seed:
136
- desc: null
137
- value: 42
138
- max_steps:
139
- desc: null
140
- value: 100000
141
- global_batch_size:
142
- desc: null
143
- value: 128
144
- device_batch_size:
145
- desc: null
146
- value: 32
147
- learning_rate:
148
- desc: null
149
- value: 2.0e-05
150
- weight_decay:
151
- desc: null
152
- value: 0.01
153
- warmup_steps:
154
- desc: null
155
- value: 500
156
- dataset_name:
157
- desc: null
158
- value: libero_spatial_no_noops
159
- data_root_dir:
160
- desc: null
161
- value: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds
162
- use_wrist_image:
163
- desc: null
164
- value: true
165
- use_proprio:
166
- desc: null
167
- value: true
168
- sequence_length:
169
- desc: null
170
- value: 64
171
- num_workers:
172
- desc: null
173
- value: 0
174
- num_diffusion_steps:
175
- desc: null
176
- value: 1000
177
- num_diffusion_inference_steps:
178
- desc: null
179
- value: 30
180
- lang_cond_dim:
181
- desc: null
182
- value: 1152
183
- img_cond_dim:
184
- desc: null
185
- value: 1152
186
- num_patches:
187
- desc: null
188
- value: 729
189
- dit_hidden_dim:
190
- desc: null
191
- value: 2048
192
- dit_depth:
193
- desc: null
194
- value: 28
195
- dit_num_heads:
196
- desc: null
197
- value: 16
198
- save_interval:
199
- desc: null
200
- value: 1000
201
- eval_interval:
202
- desc: null
203
- value: 500
204
- log_interval:
205
- desc: null
206
- value: 10
207
- save_num_checkpoints_to_keep:
208
- desc: null
209
- value: 3
210
- save_overwrite:
211
- desc: null
212
- value: true
213
- precision:
214
- desc: null
215
- value: amp_bf16
216
- gradient_accumulation_steps:
217
- desc: null
218
- value: 1
219
- max_grad_norm:
220
- desc: null
221
- value: 1.0
222
- wandb_project:
223
- desc: null
224
- value: a1-dit-action-20.47
225
- wandb_entity:
226
- desc: null
227
- value: demo0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_163819-kujhudzv/files/output.log DELETED
@@ -1,160 +0,0 @@
1
- Traceback (most recent call last):
2
- File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 216, in main
3
- trainer.fit()
4
- File "/home/zhangjian/A1/olmo/train.py", line 2798, in fit
5
- metrics = self.train_step(batch)
6
- File "/home/zhangjian/A1/olmo/train.py", line 2735, in train_step
7
- image_embeds = self.vision_model(pixel_values=batch["pixel_values"]).last_hidden_state.detach()
8
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
9
- return self._call_impl(*args, **kwargs)
10
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
11
- return forward_call(*args, **kwargs)
12
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
13
- output = func(self, *args, **kwargs)
14
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 870, in forward
15
- return self.vision_model(
16
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
17
- return self._call_impl(*args, **kwargs)
18
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
19
- return forward_call(*args, **kwargs)
20
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
21
- output = func(self, *args, **kwargs)
22
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 777, in forward
23
- encoder_outputs: BaseModelOutput = self.encoder(
24
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
25
- return self._call_impl(*args, **kwargs)
26
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
27
- return forward_call(*args, **kwargs)
28
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
29
- output = func(self, *args, **kwargs)
30
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 608, in forward
31
- layer_outputs = encoder_layer(
32
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/modeling_layers.py", line 83, in __call__
33
- return super().__call__(*args, **kwargs)
34
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
35
- return self._call_impl(*args, **kwargs)
36
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
37
- return forward_call(*args, **kwargs)
38
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 472, in forward
39
- hidden_states = self.mlp(hidden_states)
40
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
41
- return self._call_impl(*args, **kwargs)
42
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
43
- return forward_call(*args, **kwargs)
44
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 429, in forward
45
- hidden_states = self.fc1(hidden_states)
46
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
47
- return self._call_impl(*args, **kwargs)
48
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
49
- return forward_call(*args, **kwargs)
50
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/linear.py", line 125, in forward
51
- return F.linear(input, self.weight, self.bias)
52
- torch.OutOfMemoryError: CUDA out of memory. Tried to allocate 768.00 MiB. GPU 0 has a total capacity of 79.44 GiB of which 441.00 MiB is free. Including non-PyTorch memory, this process has 79.00 GiB memory in use. Of the allocated memory 77.89 GiB is allocated by PyTorch, and 630.78 MiB is reserved by PyTorch but unallocated. If reserved but unallocated memory is large try setting PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True to avoid fragmentation. See documentation for Memory Management (https://pytorch.org/docs/stable/notes/cuda.html#environment-variables)
53
- Traceback (most recent call last):
54
- File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 236, in <module>
55
- main()
56
- File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 216, in main
57
- trainer.fit()
58
- File "/home/zhangjian/A1/olmo/train.py", line 2798, in fit
59
- metrics = self.train_step(batch)
60
- File "/home/zhangjian/A1/olmo/train.py", line 2735, in train_step
61
- image_embeds = self.vision_model(pixel_values=batch["pixel_values"]).last_hidden_state.detach()
62
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
63
- return self._call_impl(*args, **kwargs)
64
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
65
- return forward_call(*args, **kwargs)
66
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
67
- output = func(self, *args, **kwargs)
68
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 870, in forward
69
- return self.vision_model(
70
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
71
- return self._call_impl(*args, **kwargs)
72
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
73
- return forward_call(*args, **kwargs)
74
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
75
- output = func(self, *args, **kwargs)
76
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 777, in forward
77
- encoder_outputs: BaseModelOutput = self.encoder(
78
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
79
- return self._call_impl(*args, **kwargs)
80
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
81
- return forward_call(*args, **kwargs)
82
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
83
- output = func(self, *args, **kwargs)
84
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 608, in forward
85
- layer_outputs = encoder_layer(
86
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/modeling_layers.py", line 83, in __call__
87
- return super().__call__(*args, **kwargs)
88
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
89
- return self._call_impl(*args, **kwargs)
90
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
91
- return forward_call(*args, **kwargs)
92
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 472, in forward
93
- hidden_states = self.mlp(hidden_states)
94
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
95
- return self._call_impl(*args, **kwargs)
96
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
97
- return forward_call(*args, **kwargs)
98
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 429, in forward
99
- hidden_states = self.fc1(hidden_states)
100
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
101
- return self._call_impl(*args, **kwargs)
102
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
103
- return forward_call(*args, **kwargs)
104
- File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/linear.py", line 125, in forward
105
- return F.linear(input, self.weight, self.bias)
106
- torch.OutOfMemoryError: CUDA out of memory. Tried to allocate 768.00 MiB. GPU 0 has a total capacity of 79.44 GiB of which 441.00 MiB is free. Including non-PyTorch memory, this process has 79.00 GiB memory in use. Of the allocated memory 77.89 GiB is allocated by PyTorch, and 630.78 MiB is reserved by PyTorch but unallocated. If reserved but unallocated memory is large try setting PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True to avoid fragmentation. See documentation for Memory Management (https://pytorch.org/docs/stable/notes/cuda.html#environment-variables)
107
- [rank0]: Traceback (most recent call last):
108
- [rank0]: File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 236, in <module>
109
- [rank0]: main()
110
- [rank0]: File "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", line 216, in main
111
- [rank0]: trainer.fit()
112
- [rank0]: File "/home/zhangjian/A1/olmo/train.py", line 2798, in fit
113
- [rank0]: metrics = self.train_step(batch)
114
- [rank0]: File "/home/zhangjian/A1/olmo/train.py", line 2735, in train_step
115
- [rank0]: image_embeds = self.vision_model(pixel_values=batch["pixel_values"]).last_hidden_state.detach()
116
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
117
- [rank0]: return self._call_impl(*args, **kwargs)
118
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
119
- [rank0]: return forward_call(*args, **kwargs)
120
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
121
- [rank0]: output = func(self, *args, **kwargs)
122
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 870, in forward
123
- [rank0]: return self.vision_model(
124
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
125
- [rank0]: return self._call_impl(*args, **kwargs)
126
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
127
- [rank0]: return forward_call(*args, **kwargs)
128
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
129
- [rank0]: output = func(self, *args, **kwargs)
130
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 777, in forward
131
- [rank0]: encoder_outputs: BaseModelOutput = self.encoder(
132
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
133
- [rank0]: return self._call_impl(*args, **kwargs)
134
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
135
- [rank0]: return forward_call(*args, **kwargs)
136
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/utils/generic.py", line 943, in wrapper
137
- [rank0]: output = func(self, *args, **kwargs)
138
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 608, in forward
139
- [rank0]: layer_outputs = encoder_layer(
140
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/modeling_layers.py", line 83, in __call__
141
- [rank0]: return super().__call__(*args, **kwargs)
142
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
143
- [rank0]: return self._call_impl(*args, **kwargs)
144
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
145
- [rank0]: return forward_call(*args, **kwargs)
146
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 472, in forward
147
- [rank0]: hidden_states = self.mlp(hidden_states)
148
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
149
- [rank0]: return self._call_impl(*args, **kwargs)
150
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
151
- [rank0]: return forward_call(*args, **kwargs)
152
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/transformers/models/siglip/modeling_siglip.py", line 429, in forward
153
- [rank0]: hidden_states = self.fc1(hidden_states)
154
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1751, in _wrapped_call_impl
155
- [rank0]: return self._call_impl(*args, **kwargs)
156
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1762, in _call_impl
157
- [rank0]: return forward_call(*args, **kwargs)
158
- [rank0]: File "/mnt/data/zhangjian/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/linear.py", line 125, in forward
159
- [rank0]: return F.linear(input, self.weight, self.bias)
160
- [rank0]: torch.OutOfMemoryError: CUDA out of memory. Tried to allocate 768.00 MiB. GPU 0 has a total capacity of 79.44 GiB of which 441.00 MiB is free. Including non-PyTorch memory, this process has 79.00 GiB memory in use. Of the allocated memory 77.89 GiB is allocated by PyTorch, and 630.78 MiB is reserved by PyTorch but unallocated. If reserved but unallocated memory is large try setting PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True to avoid fragmentation. See documentation for Memory Management (https://pytorch.org/docs/stable/notes/cuda.html#environment-variables)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_163819-kujhudzv/files/requirements.txt DELETED
@@ -1,262 +0,0 @@
1
- ai2-molmo==0.0.0
2
- yarl==1.20.1
3
- astunparse==1.6.3
4
- nvidia-cudnn-cu12==9.5.1.17
5
- etils==1.13.0
6
- tensorflow-io-gcs-filesystem==0.37.1
7
- Brotli==1.1.0
8
- gcsfs==2023.9.2
9
- multiprocess==0.70.16
10
- packaging==25.0
11
- idna==3.10
12
- absl-py==2.3.1
13
- id==1.5.0
14
- einops==0.8.1
15
- rich==13.9.4
16
- editdistance==0.8.1
17
- trouting==0.3.3
18
- mypy==1.3.0
19
- distro==1.9.0
20
- cycler==0.12.1
21
- s3transfer==0.13.0
22
- pyarrow==20.0.0
23
- sentry-sdk==2.33.0
24
- toml==0.10.2
25
- GitPython==3.1.44
26
- click==8.2.1
27
- ai2-molmo==0.0.0
28
- tensorflow-datasets==4.9.9
29
- tqdm==4.67.1
30
- safetensors==0.5.3
31
- google-auth==2.40.3
32
- iniconfig==2.1.0
33
- smmap==5.0.2
34
- nvidia-cublas-cu12==12.6.4.1
35
- wheel==0.45.1
36
- pluggy==1.6.0
37
- filelock==3.18.0
38
- google-auth-oauthlib==1.2.2
39
- httpx==0.28.1
40
- pyasn1==0.6.1
41
- typing-inspection==0.4.1
42
- pydub==0.25.1
43
- nvidia-cusparselt-cu12==0.6.3
44
- decorator==5.2.1
45
- frozenlist==1.7.0
46
- backports.tarfile==1.2.0
47
- setuptools==78.1.1
48
- keras==2.15.0
49
- MarkupSafe==3.0.2
50
- libclang==18.1.1
51
- necessary==0.4.3
52
- cached_path==1.7.3
53
- Jinja2==3.1.6
54
- beaker-py==2.4.6
55
- requests-toolbelt==1.0.0
56
- contourpy==1.3.2
57
- python-multipart==0.0.20
58
- nvidia-cusolver-cu12==11.7.1.2
59
- sentencepiece==0.2.0
60
- cffi==1.17.1
61
- gast==0.6.0
62
- nvidia-curand-cu12==10.3.7.77
63
- six==1.17.0
64
- boto3==1.39.5
65
- annotated-types==0.7.0
66
- termcolor==3.1.0
67
- pyparsing==3.2.3
68
- pydantic_core==2.33.2
69
- rfc3986==2.0.0
70
- pydantic==2.11.7
71
- jiter==0.10.0
72
- jaraco.context==6.0.1
73
- importlib_resources==6.5.2
74
- typeguard==2.13.3
75
- nltk==3.9.1
76
- opt_einsum==3.4.0
77
- grpcio==1.73.1
78
- pathspec==0.12.1
79
- triton==3.3.1
80
- gradio==5.37.0
81
- nvidia-nccl-cu12==2.26.2
82
- smart_open==7.3.0.post1
83
- scikit-learn==1.7.0
84
- pytest-sphinx==0.6.3
85
- google-cloud-core==2.4.3
86
- rsa==4.9.1
87
- readme_renderer==44.0
88
- httpcore==1.0.9
89
- threadpoolctl==3.6.0
90
- fsspec==2023.9.2
91
- keyring==25.6.0
92
- aiohttp==3.12.14
93
- attrs==25.3.0
94
- mypy_extensions==1.1.0
95
- antlr4-python3-runtime==4.9.3
96
- orjson==3.11.0
97
- cachetools==5.5.2
98
- requests==2.32.4
99
- smashed==0.21.5
100
- nvidia-cuda-cupti-cu12==12.6.80
101
- aiosignal==1.4.0
102
- torch==2.7.1
103
- xxhash==3.5.0
104
- OpenEXR==3.3.4
105
- cached-property==2.0.1
106
- wcwidth==0.2.13
107
- uvicorn==0.35.0
108
- numpy==1.26.4
109
- flatbuffers==25.2.10
110
- torchmetrics==1.7.4
111
- ftfy==6.3.1
112
- dill==0.3.8
113
- multidict==6.6.3
114
- shellingham==1.5.4
115
- promise==2.3
116
- anyio==4.9.0
117
- regex==2024.11.6
118
- tensorflow-graphics==2021.12.3
119
- pycparser==2.22
120
- nvidia-cuda-runtime-cu12==12.6.77
121
- matplotlib==3.10.3
122
- google-cloud-storage==2.19.0
123
- botocore==1.39.5
124
- click-option-group==0.5.7
125
- pytz==2025.2
126
- fonttools==4.58.5
127
- pyproject_hooks==1.2.0
128
- google-crc32c==1.7.1
129
- Markdown==3.8.2
130
- requests-oauthlib==2.0.0
131
- dlimp==0.0.1
132
- nvidia-cuda-nvrtc-cu12==12.6.77
133
- tomlkit==0.13.3
134
- safehttpx==0.1.6
135
- nvidia-cufft-cu12==11.3.0.4
136
- jmespath==1.0.1
137
- protobuf==4.21.12
138
- nvidia-nvtx-cu12==12.6.77
139
- tensorflow-addons==0.23.0
140
- jaraco.classes==3.4.0
141
- aiofiles==24.1.0
142
- exceptiongroup==1.3.0
143
- libcst==1.8.2
144
- immutabledict==4.2.1
145
- oauthlib==3.3.1
146
- timm==1.0.16
147
- lightning-utilities==0.14.3
148
- jeepney==0.9.0
149
- certifi==2025.7.14
150
- docutils==0.21.2
151
- markdown-it-py==3.0.0
152
- proto-plus==1.26.1
153
- wrapt==1.14.1
154
- mdurl==0.1.2
155
- more-itertools==10.7.0
156
- platformdirs==4.3.8
157
- kiwisolver==1.4.8
158
- tensorboard-data-server==0.7.2
159
- propcache==0.3.2
160
- zipp==3.23.0
161
- Werkzeug==3.1.3
162
- wandb==0.21.0
163
- Levenshtein==0.27.1
164
- isort==5.12.0
165
- simple-parsing==0.1.7
166
- face==24.0.0
167
- tzdata==2025.2
168
- h5py==3.14.0
169
- psutil==7.0.0
170
- mpmath==1.3.0
171
- dm-tree==0.1.9
172
- tensorflow-estimator==2.15.0
173
- pip==25.1
174
- joblib==1.5.1
175
- pyasn1_modules==0.4.2
176
- RapidFuzz==3.13.0
177
- cryptography==45.0.5
178
- typing_extensions==4.14.1
179
- urllib3==2.5.0
180
- sniffio==1.3.1
181
- omegaconf==2.3.0
182
- h11==0.16.0
183
- nvidia-cusparse-cu12==12.5.4.2
184
- click-help-colors==0.9.4
185
- einops-exts==0.0.4
186
- scipy==1.15.3
187
- nvidia-cufile-cu12==1.11.1.6
188
- huggingface-hub==0.33.4
189
- PyYAML==6.0.2
190
- pandas==2.3.1
191
- python-dateutil==2.9.0.post0
192
- petname==2.6
193
- tensorboard==2.15.2
194
- python-Levenshtein==0.27.1
195
- graphviz==0.21
196
- datasets==4.0.0
197
- gradio_client==1.10.4
198
- networkx==3.4.2
199
- nh3==0.2.22
200
- jaraco.functools==4.2.1
201
- ml-dtypes==0.2.0
202
- gitdb==4.0.12
203
- google-pasta==0.2.0
204
- openai==1.96.1
205
- aiohappyeyeballs==2.6.1
206
- docstring_parser==0.16
207
- build==1.2.2.post1
208
- tokenizers==0.21.2
209
- black==23.12.1
210
- fiddle==0.3.0
211
- requirements-parser==0.13.0
212
- ruff==0.12.3
213
- trimesh==4.7.0
214
- Pygments==2.19.2
215
- google-resumable-media==2.7.2
216
- async-timeout==5.0.1
217
- hf-xet==1.1.5
218
- groovy==0.1.2
219
- accelerate==1.8.1
220
- diffusers==0.33.1
221
- SecretStorage==3.3.3
222
- ffmpy==0.6.0
223
- websockets==15.0.1
224
- fastapi==0.116.1
225
- importlib_metadata==8.7.0
226
- pillow==11.3.0
227
- nvidia-nvjitlink-cu12==12.6.85
228
- beaker-gantry==2.8.3
229
- glom==24.11.0
230
- transformers==4.53.2
231
- pytest==8.4.1
232
- tensorflow==2.15.0
233
- semantic-version==2.10.0
234
- charset-normalizer==3.4.2
235
- tensorflow-metadata==1.17.2
236
- googleapis-common-protos==1.70.0
237
- boltons==25.0.0
238
- twine==6.1.0
239
- tomli==2.2.1
240
- google-api-core==2.25.1
241
- typer==0.16.0
242
- sympy==1.14.0
243
- starlette==0.47.1
244
- msgspec==0.19.0
245
- array_record==0.7.2
246
- torchvision==0.22.1
247
- typing_extensions==4.12.2
248
- wheel==0.45.1
249
- backports.tarfile==1.2.0
250
- inflect==7.3.1
251
- zipp==3.19.2
252
- jaraco.collections==5.1.0
253
- jaraco.text==3.12.1
254
- jaraco.context==5.3.0
255
- jaraco.functools==4.0.1
256
- tomli==2.0.1
257
- platformdirs==4.2.2
258
- packaging==24.2
259
- typeguard==4.3.0
260
- importlib_metadata==8.0.0
261
- more-itertools==10.3.0
262
- autocommand==2.2.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_163819-kujhudzv/files/wandb-metadata.json DELETED
@@ -1 +0,0 @@
1
- {"os": "Linux-5.15.0-142-generic-x86_64-with-glibc2.35", "python": "CPython 3.10.16", "started_at": "2025-07-18T08:38:19.403312Z", "args": ["--save_folder=/mnt/data/zhangjian/a1/libero_spatial_dit_action", "--save_overwrite"], "program": "/home/zhangjian/A1/launch_scripts/train_vla_dit_action.py", "code_path": "launch_scripts/train_vla_dit_action.py", "code_path_local": "launch_scripts/train_vla_dit_action.py", "git": {"remote_url": "https://github.com/Spatialtemporal-AI/A1.git", "commit": "2e05e206652258f5fbb178ec13c792c2a91c1856"}, "root": "/home/zhangjian/A1", "host": "iv-ydwxzrkf0gvr6okuck21", "executable": "/mnt/data/zhangjian/miniconda3/envs/a1/bin/python3.10", "cpu_count": 56, "cpu_count_logical": 112, "gpu_type": "NVIDIA A100-SXM4-80GB", "gpu_count": 8, "disk": {"/": {"total": "507024936960", "used": "133188997120"}}, "memory": {"total": "2071488372736"}, "gpu_nvidia": [{"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-b01b938f-1b95-8587-4b93-cfa68d84c935"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-49b283f0-f1e6-992d-4ed8-99855a5e6529"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-a340dca6-1db9-f578-76f2-cf36f74ffabd"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-c1bddabf-aa88-9c8f-eec2-6dc3e117f985"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-4096c1e7-0437-6727-096f-d67141c140b8"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-eeb896c0-61d6-8380-778b-d02101078a17"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-d5c1ed79-76e3-22a6-8908-df289b090c03"}, {"name": "NVIDIA A100-SXM4-80GB", "memory_total": "85899345920", "cuda_cores": 6912, "architecture": "Ampere", "uuid": "GPU-6d90b060-f6f7-599b-f939-4ba124ff11b7"}], "cuda_version": "12.8", "writer_id": "oygl393zcukmmdj0i9c4b0424qwzehyz"}
 
 
wandb/offline-run-20250718_163819-kujhudzv/files/wandb-summary.json DELETED
@@ -1 +0,0 @@
1
- {"_runtime": 9}
 
 
wandb/offline-run-20250718_163819-kujhudzv/logs/debug-core.log DELETED
@@ -1,14 +0,0 @@
1
- {"time":"2025-07-18T16:38:19.433873148+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpptx2rkja/port-2907721.txt","pid":2907721,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
- {"time":"2025-07-18T16:38:19.434389567+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":2907721}
3
- {"time":"2025-07-18T16:38:19.434364202+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2907721-2910040-479139429/socket","Net":"unix"}}
4
- {"time":"2025-07-18T16:38:19.611743485+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
- {"time":"2025-07-18T16:38:19.616099563+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"kujhudzv","id":"1(@)"}
6
- {"time":"2025-07-18T16:38:19.735468949+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"kujhudzv","id":"1(@)"}
7
- {"time":"2025-07-18T16:38:28.751051088+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
- {"time":"2025-07-18T16:38:28.751139005+08:00","level":"INFO","msg":"server is shutting down"}
9
- {"time":"2025-07-18T16:38:28.751126778+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
- {"time":"2025-07-18T16:38:28.751218178+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
11
- {"time":"2025-07-18T16:38:28.751229032+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2907721-2910040-479139429/socket","Net":"unix"}}
12
- {"time":"2025-07-18T16:38:28.753347379+08:00","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
13
- {"time":"2025-07-18T16:38:28.753373097+08:00","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
14
- {"time":"2025-07-18T16:38:28.753384353+08:00","level":"INFO","msg":"server is closed"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_163819-kujhudzv/logs/debug-internal.log DELETED
@@ -1,13 +0,0 @@
1
- {"time":"2025-07-18T16:38:19.620235579+08:00","level":"INFO","msg":"stream: starting","core version":"0.21.0"}
2
- {"time":"2025-07-18T16:38:19.735259373+08:00","level":"WARN","msg":"GraphQL client is nil, skipping feature loading"}
3
- {"time":"2025-07-18T16:38:19.735439442+08:00","level":"INFO","msg":"stream: created new stream","id":"kujhudzv"}
4
- {"time":"2025-07-18T16:38:19.735463779+08:00","level":"INFO","msg":"stream: started","id":"kujhudzv"}
5
- {"time":"2025-07-18T16:38:19.735487143+08:00","level":"INFO","msg":"writer: Do: started","stream_id":"kujhudzv"}
6
- {"time":"2025-07-18T16:38:19.7355104+08:00","level":"INFO","msg":"sender: started","stream_id":"kujhudzv"}
7
- {"time":"2025-07-18T16:38:19.735512981+08:00","level":"INFO","msg":"handler: started","stream_id":"kujhudzv"}
8
- {"time":"2025-07-18T16:38:19.737472829+08:00","level":"WARN","msg":"runupserter: server does not expand metric globs but the x_server_side_expand_glob_metrics setting is set; ignoring"}
9
- {"time":"2025-07-18T16:38:28.75123625+08:00","level":"INFO","msg":"stream: closing","id":"kujhudzv"}
10
- {"time":"2025-07-18T16:38:28.751382942+08:00","level":"INFO","msg":"handler: closed","stream_id":"kujhudzv"}
11
- {"time":"2025-07-18T16:38:28.751390848+08:00","level":"INFO","msg":"writer: Close: closed","stream_id":"kujhudzv"}
12
- {"time":"2025-07-18T16:38:28.751399279+08:00","level":"INFO","msg":"sender: closed","stream_id":"kujhudzv"}
13
- {"time":"2025-07-18T16:38:28.751516927+08:00","level":"INFO","msg":"stream: closed","id":"kujhudzv"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
wandb/offline-run-20250718_163819-kujhudzv/logs/debug.log DELETED
File without changes
wandb/offline-run-20250718_163819-kujhudzv/run-kujhudzv.wandb DELETED
Binary file (24 kB)
 
wandb/offline-run-20250718_163819-kujhudzv/run-kujhudzv.wandb.synced DELETED
File without changes
wandb/offline-run-20250718_164033-dnuid9t7/files/output.log DELETED
File without changes
wandb/offline-run-20250718_164033-dnuid9t7/files/requirements.txt DELETED
@@ -1,262 +0,0 @@
1
- ai2-molmo==0.0.0
2
- yarl==1.20.1
3
- astunparse==1.6.3
4
- nvidia-cudnn-cu12==9.5.1.17
5
- etils==1.13.0
6
- tensorflow-io-gcs-filesystem==0.37.1
7
- Brotli==1.1.0
8
- gcsfs==2023.9.2
9
- multiprocess==0.70.16
10
- packaging==25.0
11
- idna==3.10
12
- absl-py==2.3.1
13
- id==1.5.0
14
- einops==0.8.1
15
- rich==13.9.4
16
- editdistance==0.8.1
17
- trouting==0.3.3
18
- mypy==1.3.0
19
- distro==1.9.0
20
- cycler==0.12.1
21
- s3transfer==0.13.0
22
- pyarrow==20.0.0
23
- sentry-sdk==2.33.0
24
- toml==0.10.2
25
- GitPython==3.1.44
26
- click==8.2.1
27
- ai2-molmo==0.0.0
28
- tensorflow-datasets==4.9.9
29
- tqdm==4.67.1
30
- safetensors==0.5.3
31
- google-auth==2.40.3
32
- iniconfig==2.1.0
33
- smmap==5.0.2
34
- nvidia-cublas-cu12==12.6.4.1
35
- wheel==0.45.1
36
- pluggy==1.6.0
37
- filelock==3.18.0
38
- google-auth-oauthlib==1.2.2
39
- httpx==0.28.1
40
- pyasn1==0.6.1
41
- typing-inspection==0.4.1
42
- pydub==0.25.1
43
- nvidia-cusparselt-cu12==0.6.3
44
- decorator==5.2.1
45
- frozenlist==1.7.0
46
- backports.tarfile==1.2.0
47
- setuptools==78.1.1
48
- keras==2.15.0
49
- MarkupSafe==3.0.2
50
- libclang==18.1.1
51
- necessary==0.4.3
52
- cached_path==1.7.3
53
- Jinja2==3.1.6
54
- beaker-py==2.4.6
55
- requests-toolbelt==1.0.0
56
- contourpy==1.3.2
57
- python-multipart==0.0.20
58
- nvidia-cusolver-cu12==11.7.1.2
59
- sentencepiece==0.2.0
60
- cffi==1.17.1
61
- gast==0.6.0
62
- nvidia-curand-cu12==10.3.7.77
63
- six==1.17.0
64
- boto3==1.39.5
65
- annotated-types==0.7.0
66
- termcolor==3.1.0
67
- pyparsing==3.2.3
68
- pydantic_core==2.33.2
69
- rfc3986==2.0.0
70
- pydantic==2.11.7
71
- jiter==0.10.0
72
- jaraco.context==6.0.1
73
- importlib_resources==6.5.2
74
- typeguard==2.13.3
75
- nltk==3.9.1
76
- opt_einsum==3.4.0
77
- grpcio==1.73.1
78
- pathspec==0.12.1
79
- triton==3.3.1
80
- gradio==5.37.0
81
- nvidia-nccl-cu12==2.26.2
82
- smart_open==7.3.0.post1
83
- scikit-learn==1.7.0
84
- pytest-sphinx==0.6.3
85
- google-cloud-core==2.4.3
86
- rsa==4.9.1
87
- readme_renderer==44.0
88
- httpcore==1.0.9
89
- threadpoolctl==3.6.0
90
- fsspec==2023.9.2
91
- keyring==25.6.0
92
- aiohttp==3.12.14
93
- attrs==25.3.0
94
- mypy_extensions==1.1.0
95
- antlr4-python3-runtime==4.9.3
96
- orjson==3.11.0
97
- cachetools==5.5.2
98
- requests==2.32.4
99
- smashed==0.21.5
100
- nvidia-cuda-cupti-cu12==12.6.80
101
- aiosignal==1.4.0
102
- torch==2.7.1
103
- xxhash==3.5.0
104
- OpenEXR==3.3.4
105
- cached-property==2.0.1
106
- wcwidth==0.2.13
107
- uvicorn==0.35.0
108
- numpy==1.26.4
109
- flatbuffers==25.2.10
110
- torchmetrics==1.7.4
111
- ftfy==6.3.1
112
- dill==0.3.8
113
- multidict==6.6.3
114
- shellingham==1.5.4
115
- promise==2.3
116
- anyio==4.9.0
117
- regex==2024.11.6
118
- tensorflow-graphics==2021.12.3
119
- pycparser==2.22
120
- nvidia-cuda-runtime-cu12==12.6.77
121
- matplotlib==3.10.3
122
- google-cloud-storage==2.19.0
123
- botocore==1.39.5
124
- click-option-group==0.5.7
125
- pytz==2025.2
126
- fonttools==4.58.5
127
- pyproject_hooks==1.2.0
128
- google-crc32c==1.7.1
129
- Markdown==3.8.2
130
- requests-oauthlib==2.0.0
131
- dlimp==0.0.1
132
- nvidia-cuda-nvrtc-cu12==12.6.77
133
- tomlkit==0.13.3
134
- safehttpx==0.1.6
135
- nvidia-cufft-cu12==11.3.0.4
136
- jmespath==1.0.1
137
- protobuf==4.21.12
138
- nvidia-nvtx-cu12==12.6.77
139
- tensorflow-addons==0.23.0
140
- jaraco.classes==3.4.0
141
- aiofiles==24.1.0
142
- exceptiongroup==1.3.0
143
- libcst==1.8.2
144
- immutabledict==4.2.1
145
- oauthlib==3.3.1
146
- timm==1.0.16
147
- lightning-utilities==0.14.3
148
- jeepney==0.9.0
149
- certifi==2025.7.14
150
- docutils==0.21.2
151
- markdown-it-py==3.0.0
152
- proto-plus==1.26.1
153
- wrapt==1.14.1
154
- mdurl==0.1.2
155
- more-itertools==10.7.0
156
- platformdirs==4.3.8
157
- kiwisolver==1.4.8
158
- tensorboard-data-server==0.7.2
159
- propcache==0.3.2
160
- zipp==3.23.0
161
- Werkzeug==3.1.3
162
- wandb==0.21.0
163
- Levenshtein==0.27.1
164
- isort==5.12.0
165
- simple-parsing==0.1.7
166
- face==24.0.0
167
- tzdata==2025.2
168
- h5py==3.14.0
169
- psutil==7.0.0
170
- mpmath==1.3.0
171
- dm-tree==0.1.9
172
- tensorflow-estimator==2.15.0
173
- pip==25.1
174
- joblib==1.5.1
175
- pyasn1_modules==0.4.2
176
- RapidFuzz==3.13.0
177
- cryptography==45.0.5
178
- typing_extensions==4.14.1
179
- urllib3==2.5.0
180
- sniffio==1.3.1
181
- omegaconf==2.3.0
182
- h11==0.16.0
183
- nvidia-cusparse-cu12==12.5.4.2
184
- click-help-colors==0.9.4
185
- einops-exts==0.0.4
186
- scipy==1.15.3
187
- nvidia-cufile-cu12==1.11.1.6
188
- huggingface-hub==0.33.4
189
- PyYAML==6.0.2
190
- pandas==2.3.1
191
- python-dateutil==2.9.0.post0
192
- petname==2.6
193
- tensorboard==2.15.2
194
- python-Levenshtein==0.27.1
195
- graphviz==0.21
196
- datasets==4.0.0
197
- gradio_client==1.10.4
198
- networkx==3.4.2
199
- nh3==0.2.22
200
- jaraco.functools==4.2.1
201
- ml-dtypes==0.2.0
202
- gitdb==4.0.12
203
- google-pasta==0.2.0
204
- openai==1.96.1
205
- aiohappyeyeballs==2.6.1
206
- docstring_parser==0.16
207
- build==1.2.2.post1
208
- tokenizers==0.21.2
209
- black==23.12.1
210
- fiddle==0.3.0
211
- requirements-parser==0.13.0
212
- ruff==0.12.3
213
- trimesh==4.7.0
214
- Pygments==2.19.2
215
- google-resumable-media==2.7.2
216
- async-timeout==5.0.1
217
- hf-xet==1.1.5
218
- groovy==0.1.2
219
- accelerate==1.8.1
220
- diffusers==0.33.1
221
- SecretStorage==3.3.3
222
- ffmpy==0.6.0
223
- websockets==15.0.1
224
- fastapi==0.116.1
225
- importlib_metadata==8.7.0
226
- pillow==11.3.0
227
- nvidia-nvjitlink-cu12==12.6.85
228
- beaker-gantry==2.8.3
229
- glom==24.11.0
230
- transformers==4.53.2
231
- pytest==8.4.1
232
- tensorflow==2.15.0
233
- semantic-version==2.10.0
234
- charset-normalizer==3.4.2
235
- tensorflow-metadata==1.17.2
236
- googleapis-common-protos==1.70.0
237
- boltons==25.0.0
238
- twine==6.1.0
239
- tomli==2.2.1
240
- google-api-core==2.25.1
241
- typer==0.16.0
242
- sympy==1.14.0
243
- starlette==0.47.1
244
- msgspec==0.19.0
245
- array_record==0.7.2
246
- torchvision==0.22.1
247
- typing_extensions==4.12.2
248
- wheel==0.45.1
249
- backports.tarfile==1.2.0
250
- inflect==7.3.1
251
- zipp==3.19.2
252
- jaraco.collections==5.1.0
253
- jaraco.text==3.12.1
254
- jaraco.context==5.3.0
255
- jaraco.functools==4.0.1
256
- tomli==2.0.1
257
- platformdirs==4.2.2
258
- packaging==24.2
259
- typeguard==4.3.0
260
- importlib_metadata==8.0.0
261
- more-itertools==10.3.0
262
- autocommand==2.2.2