Upload GR00T_N1_5 checkpoint 60000 for OpenWBC bottle task

Files changed (14)

experiment_cfg/conf.yaml CHANGED Viewed

@@ -65,7 +65,7 @@ model:
 data:
   datasets:
   - dataset_paths:
-    - /home/opuser/wtx/vla/data/new/onlybottom_gr00t
     embodiment_tag: new_embodiment
     mix_ratio: 1.0
     dataset_type: physical_embodiment
@@ -187,9 +187,9 @@ data:
   - 224
   video_backend: torchcodec
 training:
-  output_dir: ./save/test1
   experiment_name: null
-  max_steps: 20000
   global_batch_size: 96
   batch_size: null
   gradient_accumulation_steps: 1
@@ -200,13 +200,13 @@ training:
   warmup_steps: 0
   max_grad_norm: 1.0
   optim: adamw_torch
-  start_from_checkpoint: ../models/GR00T-N1.6-G1-PnPAppleToPlate/
   tf32: true
   fp16: false
   bf16: true
   eval_bf16: true
   logging_steps: 10
-  save_steps: 1000
   save_total_limit: 5
   save_vl_model: false
   upload_checkpoints: false
@@ -241,5 +241,5 @@ training:
   - 0
   open_loop_eval_steps_per_traj: 100
   open_loop_eval_plot_indices: null
-max_steps: 20000
-save_steps: 1000

 data:
   datasets:
   - dataset_paths:
+    - /home/opuser/wtx/vla/data/gr00t/new/onlybottom_gr00t
     embodiment_tag: new_embodiment
     mix_ratio: 1.0
     dataset_type: physical_embodiment
   - 224
   video_backend: torchcodec
 training:
+  output_dir: ./save/test6000
   experiment_name: null
+  max_steps: 60000
   global_batch_size: 96
   batch_size: null
   gradient_accumulation_steps: 1
   warmup_steps: 0
   max_grad_norm: 1.0
   optim: adamw_torch
+  start_from_checkpoint: /home/opuser/wtx/vla/models/GR00T-N1.6-G1-PnPAppleToPlate
   tf32: true
   fp16: false
   bf16: true
   eval_bf16: true
   logging_steps: 10
+  save_steps: 5000
   save_total_limit: 5
   save_vl_model: false
   upload_checkpoints: false
   - 0
   open_loop_eval_steps_per_traj: 100
   open_loop_eval_plot_indices: null
+max_steps: 60000
+save_steps: 5000

experiment_cfg/config.yaml CHANGED Viewed

@@ -4,7 +4,7 @@ data: !!python/object:gr00t.configs.data.data_config.DataConfig
   datasets:
   - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
     dataset_paths:
-    - /home/opuser/wtx/vla/data/new/onlybottom_gr00t
     dataset_type: physical_embodiment
     embodiment_tag: new_embodiment
     mix_ratio: 1.0
@@ -253,21 +253,21 @@ training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
   max_concurrent_uploads: 2
   max_grad_norm: 1.0
   max_retries: 3
-  max_steps: 20000
   num_gpus: 2
   open_loop_eval_plot_indices: null
   open_loop_eval_steps_per_traj: 100
   open_loop_eval_traj_ids:
   - 0
   optim: adamw_torch
-  output_dir: ./save/test1
   remove_unused_columns: false
   save_best_eval_metric_greater_is_better: true
   save_best_eval_metric_name: ''
-  save_steps: 1000
   save_total_limit: 5
   save_vl_model: false
-  start_from_checkpoint: ../models/GR00T-N1.6-G1-PnPAppleToPlate/
   tf32: true
   transformers_access_token: null
   transformers_cache_dir: null

   datasets:
   - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
     dataset_paths:
+    - /home/opuser/wtx/vla/data/gr00t/new/onlybottom_gr00t
     dataset_type: physical_embodiment
     embodiment_tag: new_embodiment
     mix_ratio: 1.0
   max_concurrent_uploads: 2
   max_grad_norm: 1.0
   max_retries: 3
+  max_steps: 60000
   num_gpus: 2
   open_loop_eval_plot_indices: null
   open_loop_eval_steps_per_traj: 100
   open_loop_eval_traj_ids:
   - 0
   optim: adamw_torch
+  output_dir: ./save/test6000
   remove_unused_columns: false
   save_best_eval_metric_greater_is_better: true
   save_best_eval_metric_name: ''
+  save_steps: 5000
   save_total_limit: 5
   save_vl_model: false
+  start_from_checkpoint: /home/opuser/wtx/vla/models/GR00T-N1.6-G1-PnPAppleToPlate
   tf32: true
   transformers_access_token: null
   transformers_cache_dir: null

global_step60000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:63d230f64928175c6af4f17e0412783538ab366382fa6058eaa6bdcd6dcf3c5c
+size 9719841825

global_step60000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef845a54f74aca7e7d730957939008f393d7db61e49a03e3c44b4cdb33bae64a
+size 9719835873

global_step60000/mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0981877d4d94ba5df862920ecd3eb841288114e4888b7fea1581331af8fb103
+size 9907202435

latest CHANGED Viewed

	@@ -1 +1 @@
1	- global_step20000


1	+ global_step60000

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a229a9f6dedeaee028cd1b60f4f8e1f938836efb98d39b422f4c5ad8c665b02b
 size 4991091456

 version https://git-lfs.github.com/spec/v1
+oid sha256:cf5bae92cdb4e52d89fb76282f84cb0c1aa811ef4252c6261bcf3a8ae5b71e9a
 size 4991091456

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af1879144a86a457d2603f333003a55a59e9b0d5906143828728afcf75d6380f
 size 1582283096

 version https://git-lfs.github.com/spec/v1
+oid sha256:e5153e1d8be1ea2726732c057906ddcf3309f6ac5a0236d2a6b839696b5b1975
 size 1582283096

rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a2d386a33a3a3e726b5af06a1adef33f3da8e695771b1410c8be86d10f29b3b
 size 14917

 version https://git-lfs.github.com/spec/v1
+oid sha256:8a1258e46605de576a62034dd10ba29c0a34e9a8238cf43f02aedbc426594eac
 size 14917

rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e4d3c79f81b9d18e67f3cc1809d5633c90ae75a4916c495e3f9cb6a8f5483ace
 size 14917

 version https://git-lfs.github.com/spec/v1
+oid sha256:26b5993f4cffa03a121b1ee1670a40a77f949b7a4e76e5102ab72e91290e8f59
 size 14917

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7fa802a80def971b73ec74284a6aa44d0b2ea101bd38ed41a3b1c1a0b4001f00
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:96b418fbb509f96d95ad52dd99d48eeb782a306175bb55d2661eb9b3585613ba
 size 1465

trainer_state.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6270b2f9a0a7d10b725ab54b19d53553b72c7707af49e677cf873b583dc2b4d1
 size 7633

 version https://git-lfs.github.com/spec/v1
+oid sha256:560a23fc414112b4ca651369d3d4ebef45c1454b966cb7683543d996709746be
 size 7633

wandb_config.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"project": "finetune-gr00t-n1d6", "run_id": "test1"}


1	+ {"project": "finetune-gr00t-n1d6", "run_id": "test6000"}