Upload folder using huggingface_hub

Browse files

Files changed (5) hide show

cfg.yaml +201 -0
train-cfg.yaml +280 -0
wandb/run-20251225_195640-1lai13bo/files/cfg.yaml +201 -0
wandb/run-20251225_195640-1lai13bo/files/config.yaml +344 -0
wandb/run-20251225_195640-1lai13bo/files/train-cfg.yaml +280 -0

cfg.yaml ADDED Viewed

	@@ -0,0 +1,201 @@

+num_workers: 4
+prefetch_factor: 2
+split_seed: 42
+epoch_iterator: eager
+epochs: 121
+batch_size: 32
+grad_accum_steps: 1
+lr:
+  base: 5.0e-05
+  vlm_bridge: 1.0e-05
+  action_expert: 5.0e-05
+warmup_steps: 0
+cosine_anneal_epoch: 0
+betas:
+- 0.99
+- 0.9999
+eps: 1.0e-08
+weight_decay: 0.0001
+clip_grad_norm: 1.0
+exp_name: pi-training
+log_interval: 32
+eval_interval: 512
+save_interval: 40
+data:
+  _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+  root_path: null
+  action_horizon: null
+  state_history: null
+  input_transforms: []
+  output_transforms: []
+  output_inv_transforms: []
+  norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+  noise_cfg: null
+  repo_id: horipse01/lerobot_merged_restricted
+  bbox_only: false
+  remove_bbox: false
+  episodes: null
+  splits:
+  - .*
+train_data:
+  datasets:
+    action_a:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      batch_size: 64
+eval_data:
+  datasets:
+    action_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: sample_mse
+    action_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: sample_mse
+    generation_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: generation
+    generation_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: generation
+eval_num_sample_steps: 10
+eval_batch_size: 32
+policy:
+  _target_: vla_scratch.policies.pi.policy.PiPolicy
+  transforms:
+  - _target_: vla_scratch.policies.modules.vlm_bridge.qwen.processor.QwenProcessor
+    processor_class: Qwen3VLProcessor
+    model_id: Qwen/Qwen3-VL-2B-Instruct
+    max_length: 500
+    padding: max_length
+  state_history: 0
+  action_horizon: 10
+  state_dim: null
+  action_dim: null
+  vlm_type: Qwen3VLForConditionalGeneration
+  model_id: Qwen/Qwen3-VL-2B-Instruct
+  action_expert_cfg:
+    hidden_size: 1024
+    intermediate_size: 4096
+    num_attention_heads: 8
+    num_key_value_heads: 8
+    head_dim: 512
+    cross_attention_every: 2
+    qk_norm: layernorm
+    rotary_self_attn: true
+    only_attend_to_final_layer: true
+    attn_dropout: 0.0
+    mlp_dropout: 0.0
+    mlp_activation: silu
+    num_hidden_layers: 12
+    layers_for_dispersive_loss:
+    - 6
+    dispersive_loss_tau: 1.0
+    rms_norm_eps: 1.0e-06
+    attention_dropout: 0.0
+    attention_bias: true
+    max_position_embeddings: 8192
+    rope_theta: 10000.0
+  suffix_add_pos_emb: true
+  use_state: false
+  num_obs_registers: 4
+  expert_only_use_register: true
+  num_noise_per_sample: 2
+  num_noise_before_topk: 2
+  detach_kv_cache: false
+  ce_loss_weight: 0.1
+  disp_loss_weight: 0.0
+  time_dist_alpha: 1.0
+  time_dist_beta: 1.5
+  obs_register_init_gain: 0.02
+  suffix_pos_emb_init_gain: 0.02
+  zero_pos_id_for_obs_register: true
+  causal_mask_obs_register: true
+  qwen3_vl_use_grid_thw_list: true
+  qwen3_vl_recompute_pos_ids: false
+  qwen3_vl_masked_add_stack: true
+checkpoint_path: null
+load_optimizer: true
+wandb:
+  project: vla-scratch
+  mode: online
+  tags: []
+run_dir: /mnt/amlfs-01/home/hweng/projects/vla-scratch/vla-scratch/outputs/2025-12-25/19-55-39-pi-training
+world_size: 8

train-cfg.yaml ADDED Viewed

	@@ -0,0 +1,280 @@

+defaults:
+- _self_
+- policy: pi-qwen
+- data: libero-ipec
+- train_data: none
+- eval_data: none
+num_workers: 4
+prefetch_factor: 2
+split_seed: 42
+epoch_iterator: eager
+epochs: 121
+batch_size: 32
+grad_accum_steps: 1
+lr:
+  base: 5.0e-05
+  vlm_bridge: 1.0e-05
+  action_expert: 5.0e-05
+warmup_steps: 0
+cosine_anneal_epoch: 0
+betas:
+- 0.99
+- 0.9999
+eps: 1.0e-08
+weight_decay: 0.0001
+clip_grad_norm: 1.0
+exp_name: pi-training
+log_interval: 32
+eval_interval: 512
+save_interval: 40
+data:
+  _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+  root_path: null
+  action_horizon: null
+  state_history: null
+  input_transforms: []
+  output_transforms: []
+  output_inv_transforms: []
+  norm_stats_path: !!python/object/apply:pathlib.PosixPath
+  - normalization_stats
+  - bbox_cotrain
+  - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+  noise_cfg: null
+  repo_id: horipse01/lerobot_merged_restricted
+  bbox_only: false
+  remove_bbox: false
+  episodes: null
+  splits:
+  - .*
+train_data:
+  datasets:
+    action_a:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      batch_size: 64
+eval_data:
+  datasets:
+    action_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: sample_mse
+    action_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: sample_mse
+    generation_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: generation
+    generation_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: generation
+eval_num_sample_steps: 10
+eval_batch_size: 32
+policy:
+  _target_: vla_scratch.policies.pi.policy.PiPolicy
+  transforms:
+  - _target_: vla_scratch.policies.modules.vlm_bridge.qwen.processor.QwenProcessor
+    processor_class: Qwen3VLProcessor
+    model_id: Qwen/Qwen3-VL-2B-Instruct
+    max_length: 500
+    padding: max_length
+  state_history: 0
+  action_horizon: 10
+  state_dim: 1
+  action_dim: 7
+  vlm_type: Qwen3VLForConditionalGeneration
+  model_id: Qwen/Qwen3-VL-2B-Instruct
+  action_expert_cfg:
+    hidden_size: 1024
+    intermediate_size: 4096
+    num_attention_heads: 8
+    num_key_value_heads: 8
+    head_dim: 512
+    cross_attention_every: 2
+    qk_norm: layernorm
+    rotary_self_attn: true
+    only_attend_to_final_layer: true
+    attn_dropout: 0.0
+    mlp_dropout: 0.0
+    mlp_activation: silu
+    num_hidden_layers: 12
+    layers_for_dispersive_loss:
+    - 6
+    dispersive_loss_tau: 1.0
+    rms_norm_eps: 1.0e-06
+    attention_dropout: 0.0
+    attention_bias: true
+    max_position_embeddings: 8192
+    rope_theta: 10000.0
+  suffix_add_pos_emb: true
+  use_state: false
+  num_obs_registers: 4
+  expert_only_use_register: true
+  num_noise_per_sample: 2
+  num_noise_before_topk: 2
+  detach_kv_cache: false
+  ce_loss_weight: 0.1
+  disp_loss_weight: 0.0
+  time_dist_alpha: 1.0
+  time_dist_beta: 1.5
+  obs_register_init_gain: 0.02
+  suffix_pos_emb_init_gain: 0.02
+  zero_pos_id_for_obs_register: true
+  causal_mask_obs_register: true
+  qwen3_vl_use_grid_thw_list: true
+  qwen3_vl_recompute_pos_ids: false
+  qwen3_vl_masked_add_stack: true
+checkpoint_path: null
+load_optimizer: true
+wandb:
+  project: vla-scratch
+  mode: online
+  tags: []
+hydra:
+  defaults:
+  - output: default
+  - launcher: basic
+  - sweeper: basic
+  - help: default
+  - hydra_help: default
+  - hydra_logging: default
+  - job_logging: default
+  - callbacks: null
+  - env: default
+  mode: null
+  searchpath: []
+  run:
+    dir: .
+  sweep:
+    dir: ???
+    subdir: ???
+  hydra_logging: ???
+  job_logging: ???
+  sweeper: ???
+  launcher: ???
+  callbacks: {}
+  help:
+    app_name: ???
+    header: ???
+    footer: ???
+    template: ???
+  hydra_help:
+    hydra_help: ???
+    template: ???
+  output_subdir: null
+  overrides:
+    hydra: []
+    task: []
+  job:
+    name: ???
+    chdir: false
+    override_dirname: ???
+    id: ???
+    num: ???
+    config_name: ???
+    env_set: {}
+    env_copy: []
+    config:
+      override_dirname:
+        kv_sep: '='
+        item_sep: ','
+        exclude_keys: []
+  runtime:
+    version: ???
+    version_base: ???
+    cwd: ???
+    config_sources: ???
+    output_dir: ???
+    choices: {}
+  verbose: false

wandb/run-20251225_195640-1lai13bo/files/cfg.yaml ADDED Viewed

	@@ -0,0 +1,201 @@

+num_workers: 4
+prefetch_factor: 2
+split_seed: 42
+epoch_iterator: eager
+epochs: 121
+batch_size: 32
+grad_accum_steps: 1
+lr:
+  base: 5.0e-05
+  vlm_bridge: 1.0e-05
+  action_expert: 5.0e-05
+warmup_steps: 0
+cosine_anneal_epoch: 0
+betas:
+- 0.99
+- 0.9999
+eps: 1.0e-08
+weight_decay: 0.0001
+clip_grad_norm: 1.0
+exp_name: pi-training
+log_interval: 32
+eval_interval: 512
+save_interval: 40
+data:
+  _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+  root_path: null
+  action_horizon: null
+  state_history: null
+  input_transforms: []
+  output_transforms: []
+  output_inv_transforms: []
+  norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+  noise_cfg: null
+  repo_id: horipse01/lerobot_merged_restricted
+  bbox_only: false
+  remove_bbox: false
+  episodes: null
+  splits:
+  - .*
+train_data:
+  datasets:
+    action_a:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      batch_size: 64
+eval_data:
+  datasets:
+    action_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: sample_mse
+    action_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: sample_mse
+    generation_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: generation
+    generation_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: null
+        state_history: null
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: generation
+eval_num_sample_steps: 10
+eval_batch_size: 32
+policy:
+  _target_: vla_scratch.policies.pi.policy.PiPolicy
+  transforms:
+  - _target_: vla_scratch.policies.modules.vlm_bridge.qwen.processor.QwenProcessor
+    processor_class: Qwen3VLProcessor
+    model_id: Qwen/Qwen3-VL-2B-Instruct
+    max_length: 500
+    padding: max_length
+  state_history: 0
+  action_horizon: 10
+  state_dim: null
+  action_dim: null
+  vlm_type: Qwen3VLForConditionalGeneration
+  model_id: Qwen/Qwen3-VL-2B-Instruct
+  action_expert_cfg:
+    hidden_size: 1024
+    intermediate_size: 4096
+    num_attention_heads: 8
+    num_key_value_heads: 8
+    head_dim: 512
+    cross_attention_every: 2
+    qk_norm: layernorm
+    rotary_self_attn: true
+    only_attend_to_final_layer: true
+    attn_dropout: 0.0
+    mlp_dropout: 0.0
+    mlp_activation: silu
+    num_hidden_layers: 12
+    layers_for_dispersive_loss:
+    - 6
+    dispersive_loss_tau: 1.0
+    rms_norm_eps: 1.0e-06
+    attention_dropout: 0.0
+    attention_bias: true
+    max_position_embeddings: 8192
+    rope_theta: 10000.0
+  suffix_add_pos_emb: true
+  use_state: false
+  num_obs_registers: 4
+  expert_only_use_register: true
+  num_noise_per_sample: 2
+  num_noise_before_topk: 2
+  detach_kv_cache: false
+  ce_loss_weight: 0.1
+  disp_loss_weight: 0.0
+  time_dist_alpha: 1.0
+  time_dist_beta: 1.5
+  obs_register_init_gain: 0.02
+  suffix_pos_emb_init_gain: 0.02
+  zero_pos_id_for_obs_register: true
+  causal_mask_obs_register: true
+  qwen3_vl_use_grid_thw_list: true
+  qwen3_vl_recompute_pos_ids: false
+  qwen3_vl_masked_add_stack: true
+checkpoint_path: null
+load_optimizer: true
+wandb:
+  project: vla-scratch
+  mode: online
+  tags: []
+run_dir: /mnt/amlfs-01/home/hweng/projects/vla-scratch/vla-scratch/outputs/2025-12-25/19-55-39-pi-training
+world_size: 8

wandb/run-20251225_195640-1lai13bo/files/config.yaml ADDED Viewed

	@@ -0,0 +1,344 @@

+_wandb:
+    value:
+        cli_version: 0.21.4
+        e:
+            gt1vdj22y3nl3q7a422smxub7piq9xeu:
+                args:
+                    - policy=pi-qwen
+                    - policy.state_history=0
+                    - policy.action_horizon=10
+                    - policy.transforms.0.max_length=500
+                    - data=bbox_cotrain_train
+                    - batch_size=32
+                    - train_data=bbox_cotrain_baseline
+                    - train_data.datasets.action_a.batch_size=64
+                    - eval_data=bbox_cotrain_eval
+                    - num_workers=4
+                    - prefetch_factor=2
+                    - lr.base=5e-5
+                    - +lr.vlm_bridge=1e-5
+                    - +lr.action_expert=5e-5
+                    - epochs=121
+                    - save_interval=40
+                    - wandb.mode=online
+                cpu_count: 96
+                cpu_count_logical: 96
+                cudaVersion: "13.0"
+                disk:
+                    /:
+                        total: "1065418129408"
+                        used: "726712709120"
+                email: elijahgalahad@gmail.com
+                executable: /mnt/amlfs-01/home/hweng/projects/vla-scratch/vla-scratch/.venv/bin/python3
+                gpu: NVIDIA H100 80GB HBM3
+                gpu_count: 8
+                gpu_nvidia:
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-83bb76f3-06ce-7f65-9aff-97f16dbac4ce
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-6734b808-316d-13ad-3452-190c89899f8e
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-bf6464b4-ee22-dd87-184c-579e33ac7b15
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-d819de6f-6573-c624-1294-02a3acedf344
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-88262183-ce36-a48f-dc17-3bde9f4de8f3
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-98d3e6fa-f573-2b1a-79fd-01c89d027d23
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-34bb43c6-303f-2a7c-4ede-99e51fc3e28f
+                    - architecture: Hopper
+                      cudaCores: 16896
+                      memoryTotal: "85520809984"
+                      name: NVIDIA H100 80GB HBM3
+                      uuid: GPU-e30f59ec-7f5f-4c37-3417-33fccebb8823
+                host: 5c26df9320f14086-197be6b49fe441a3
+                memory:
+                    total: "2008083251200"
+                os: Linux-5.15.0-1098-azure-x86_64-with-glibc2.35
+                program: /mnt/amlfs-01/home/hweng/projects/vla-scratch/vla-scratch/scripts/train_policy.py
+                python: CPython 3.10.12
+                root: /mnt/amlfs-01/home/hweng/projects/vla-scratch/vla-scratch/outputs/2025-12-25/19-55-39-pi-training
+                startedAt: "2025-12-26T03:56:40.589357Z"
+                writerId: gt1vdj22y3nl3q7a422smxub7piq9xeu
+        m: []
+        python_version: 3.10.12
+        t:
+            "1":
+                - 1
+                - 11
+                - 41
+                - 49
+                - 50
+                - 51
+                - 71
+                - 105
+            "2":
+                - 1
+                - 11
+                - 41
+                - 49
+                - 50
+                - 51
+                - 71
+                - 105
+            "3":
+                - 3
+                - 15
+                - 17
+            "4": 3.10.12
+            "5": 0.21.4
+            "6": 4.57.1
+            "12": 0.21.4
+            "13": linux-x86_64
+batch_size:
+    value: 32
+betas:
+    value:
+        - 0.99
+        - 0.9999
+checkpoint_path:
+    value: null
+clip_grad_norm:
+    value: 1
+cosine_anneal_epoch:
+    value: 0
+data:
+    value:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        action_horizon: null
+        bbox_only: false
+        episodes: null
+        input_transforms: []
+        noise_cfg: null
+        norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        output_inv_transforms: []
+        output_transforms: []
+        remove_bbox: false
+        repo_id: horipse01/lerobot_merged_restricted
+        root_path: null
+        splits:
+            - .*
+        state_history: null
+epoch_iterator:
+    value: eager
+epochs:
+    value: 121
+eps:
+    value: 1e-08
+eval_batch_size:
+    value: 32
+eval_data:
+    value:
+        datasets:
+            action_test:
+                data:
+                    _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+                    action_horizon: null
+                    bbox_only: false
+                    episodes: null
+                    input_transforms: []
+                    noise_cfg: null
+                    norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+                    output_inv_transforms: []
+                    output_transforms: []
+                    remove_bbox: false
+                    repo_id: horipse01/lerobot_merged_restricted_val
+                    root_path: null
+                    splits:
+                        - .*
+                    state_history: null
+                eval_fraction: 0.1
+                eval_type: sample_mse
+            action_train:
+                data:
+                    _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+                    action_horizon: null
+                    bbox_only: false
+                    episodes: null
+                    input_transforms: []
+                    noise_cfg: null
+                    norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+                    output_inv_transforms: []
+                    output_transforms: []
+                    remove_bbox: false
+                    repo_id: horipse01/lerobot_merged_restricted
+                    root_path: null
+                    splits:
+                        - .*
+                    state_history: null
+                eval_fraction: 0.02
+                eval_type: sample_mse
+            generation_test:
+                data:
+                    _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+                    action_horizon: null
+                    bbox_only: true
+                    episodes: null
+                    input_transforms: []
+                    noise_cfg: null
+                    norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+                    output_inv_transforms: []
+                    output_transforms: []
+                    remove_bbox: false
+                    repo_id: horipse01/lerobot_merged_restricted_val
+                    root_path: null
+                    splits:
+                        - .*
+                    state_history: null
+                eval_fraction: 0.1
+                eval_type: generation
+            generation_train:
+                data:
+                    _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+                    action_horizon: null
+                    bbox_only: true
+                    episodes: null
+                    input_transforms: []
+                    noise_cfg: null
+                    norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+                    output_inv_transforms: []
+                    output_transforms: []
+                    remove_bbox: false
+                    repo_id: horipse01/lerobot_merged_restricted
+                    root_path: null
+                    splits:
+                        - .*
+                    state_history: null
+                eval_fraction: 0.02
+                eval_type: generation
+eval_interval:
+    value: 512
+eval_num_sample_steps:
+    value: 10
+exp_name:
+    value: pi-training
+grad_accum_steps:
+    value: 1
+load_optimizer:
+    value: true
+log_interval:
+    value: 32
+lr:
+    value:
+        action_expert: 5e-05
+        base: 5e-05
+        vlm_bridge: 1e-05
+num_workers:
+    value: 4
+policy:
+    value:
+        _target_: vla_scratch.policies.pi.policy.PiPolicy
+        action_dim: null
+        action_expert_cfg:
+            attention_bias: true
+            attention_dropout: 0
+            attn_dropout: 0
+            cross_attention_every: 2
+            dispersive_loss_tau: 1
+            head_dim: 512
+            hidden_size: 1024
+            intermediate_size: 4096
+            layers_for_dispersive_loss:
+                - 6
+            max_position_embeddings: 8192
+            mlp_activation: silu
+            mlp_dropout: 0
+            num_attention_heads: 8
+            num_hidden_layers: 12
+            num_key_value_heads: 8
+            only_attend_to_final_layer: true
+            qk_norm: layernorm
+            rms_norm_eps: 1e-06
+            rope_theta: 10000
+            rotary_self_attn: true
+        action_horizon: 10
+        causal_mask_obs_register: true
+        ce_loss_weight: 0.1
+        detach_kv_cache: false
+        disp_loss_weight: 0
+        expert_only_use_register: true
+        model_id: Qwen/Qwen3-VL-2B-Instruct
+        num_noise_before_topk: 2
+        num_noise_per_sample: 2
+        num_obs_registers: 4
+        obs_register_init_gain: 0.02
+        qwen3_vl_masked_add_stack: true
+        qwen3_vl_recompute_pos_ids: false
+        qwen3_vl_use_grid_thw_list: true
+        state_dim: null
+        state_history: 0
+        suffix_add_pos_emb: true
+        suffix_pos_emb_init_gain: 0.02
+        time_dist_alpha: 1
+        time_dist_beta: 1.5
+        transforms:
+            - _target_: vla_scratch.policies.modules.vlm_bridge.qwen.processor.QwenProcessor
+              max_length: 500
+              model_id: Qwen/Qwen3-VL-2B-Instruct
+              padding: max_length
+              processor_class: Qwen3VLProcessor
+        use_state: false
+        vlm_type: Qwen3VLForConditionalGeneration
+        zero_pos_id_for_obs_register: true
+prefetch_factor:
+    value: 2
+run_dir:
+    value: /mnt/amlfs-01/home/hweng/projects/vla-scratch/vla-scratch/outputs/2025-12-25/19-55-39-pi-training
+save_interval:
+    value: 40
+split_seed:
+    value: 42
+train_data:
+    value:
+        datasets:
+            action_a:
+                batch_size: 64
+                data:
+                    _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+                    action_horizon: null
+                    bbox_only: false
+                    episodes: null
+                    input_transforms: []
+                    noise_cfg: null
+                    norm_stats_path: normalization_stats/bbox_cotrain/lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+                    output_inv_transforms: []
+                    output_transforms: []
+                    remove_bbox: false
+                    repo_id: horipse01/lerobot_merged_restricted
+                    root_path: null
+                    splits:
+                        - .*
+                    state_history: null
+wandb:
+    value:
+        mode: online
+        project: vla-scratch
+        tags: []
+warmup_steps:
+    value: 0
+weight_decay:
+    value: 0.0001
+world_size:
+    value: 8

wandb/run-20251225_195640-1lai13bo/files/train-cfg.yaml ADDED Viewed

	@@ -0,0 +1,280 @@

+defaults:
+- _self_
+- policy: pi-qwen
+- data: libero-ipec
+- train_data: none
+- eval_data: none
+num_workers: 4
+prefetch_factor: 2
+split_seed: 42
+epoch_iterator: eager
+epochs: 121
+batch_size: 32
+grad_accum_steps: 1
+lr:
+  base: 5.0e-05
+  vlm_bridge: 1.0e-05
+  action_expert: 5.0e-05
+warmup_steps: 0
+cosine_anneal_epoch: 0
+betas:
+- 0.99
+- 0.9999
+eps: 1.0e-08
+weight_decay: 0.0001
+clip_grad_norm: 1.0
+exp_name: pi-training
+log_interval: 32
+eval_interval: 512
+save_interval: 40
+data:
+  _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+  root_path: null
+  action_horizon: null
+  state_history: null
+  input_transforms: []
+  output_transforms: []
+  output_inv_transforms: []
+  norm_stats_path: !!python/object/apply:pathlib.PosixPath
+  - normalization_stats
+  - bbox_cotrain
+  - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+  noise_cfg: null
+  repo_id: horipse01/lerobot_merged_restricted
+  bbox_only: false
+  remove_bbox: false
+  episodes: null
+  splits:
+  - .*
+train_data:
+  datasets:
+    action_a:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      batch_size: 64
+eval_data:
+  datasets:
+    action_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: sample_mse
+    action_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: false
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: sample_mse
+    generation_train:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.02
+      eval_type: generation
+    generation_test:
+      data:
+        _target_: vla_scratch.datasets.bbox_cotrain.dataset.CoTrainDataset
+        root_path: null
+        action_horizon: 10
+        state_history: 0
+        input_transforms: []
+        output_transforms: []
+        output_inv_transforms: []
+        norm_stats_path: !!python/object/apply:pathlib.PosixPath
+        - normalization_stats
+        - bbox_cotrain
+        - lerobot_norm_stats-horizon_{data.action_horizon}-history_{data.state_history}.npz
+        noise_cfg: null
+        repo_id: horipse01/lerobot_merged_restricted_val
+        bbox_only: true
+        remove_bbox: false
+        episodes: null
+        splits:
+        - .*
+      eval_fraction: 0.1
+      eval_type: generation
+eval_num_sample_steps: 10
+eval_batch_size: 32
+policy:
+  _target_: vla_scratch.policies.pi.policy.PiPolicy
+  transforms:
+  - _target_: vla_scratch.policies.modules.vlm_bridge.qwen.processor.QwenProcessor
+    processor_class: Qwen3VLProcessor
+    model_id: Qwen/Qwen3-VL-2B-Instruct
+    max_length: 500
+    padding: max_length
+  state_history: 0
+  action_horizon: 10
+  state_dim: 1
+  action_dim: 7
+  vlm_type: Qwen3VLForConditionalGeneration
+  model_id: Qwen/Qwen3-VL-2B-Instruct
+  action_expert_cfg:
+    hidden_size: 1024
+    intermediate_size: 4096
+    num_attention_heads: 8
+    num_key_value_heads: 8
+    head_dim: 512
+    cross_attention_every: 2
+    qk_norm: layernorm
+    rotary_self_attn: true
+    only_attend_to_final_layer: true
+    attn_dropout: 0.0
+    mlp_dropout: 0.0
+    mlp_activation: silu
+    num_hidden_layers: 12
+    layers_for_dispersive_loss:
+    - 6
+    dispersive_loss_tau: 1.0
+    rms_norm_eps: 1.0e-06
+    attention_dropout: 0.0
+    attention_bias: true
+    max_position_embeddings: 8192
+    rope_theta: 10000.0
+  suffix_add_pos_emb: true
+  use_state: false
+  num_obs_registers: 4
+  expert_only_use_register: true
+  num_noise_per_sample: 2
+  num_noise_before_topk: 2
+  detach_kv_cache: false
+  ce_loss_weight: 0.1
+  disp_loss_weight: 0.0
+  time_dist_alpha: 1.0
+  time_dist_beta: 1.5
+  obs_register_init_gain: 0.02
+  suffix_pos_emb_init_gain: 0.02
+  zero_pos_id_for_obs_register: true
+  causal_mask_obs_register: true
+  qwen3_vl_use_grid_thw_list: true
+  qwen3_vl_recompute_pos_ids: false
+  qwen3_vl_masked_add_stack: true
+checkpoint_path: null
+load_optimizer: true
+wandb:
+  project: vla-scratch
+  mode: online
+  tags: []
+hydra:
+  defaults:
+  - output: default
+  - launcher: basic
+  - sweeper: basic
+  - help: default
+  - hydra_help: default
+  - hydra_logging: default
+  - job_logging: default
+  - callbacks: null
+  - env: default
+  mode: null
+  searchpath: []
+  run:
+    dir: .
+  sweep:
+    dir: ???
+    subdir: ???
+  hydra_logging: ???
+  job_logging: ???
+  sweeper: ???
+  launcher: ???
+  callbacks: {}
+  help:
+    app_name: ???
+    header: ???
+    footer: ???
+    template: ???
+  hydra_help:
+    hydra_help: ???
+    template: ???
+  output_subdir: null
+  overrides:
+    hydra: []
+    task: []
+  job:
+    name: ???
+    chdir: false
+    override_dirname: ???
+    id: ???
+    num: ???
+    config_name: ???
+    env_set: {}
+    env_copy: []
+    config:
+      override_dirname:
+        kv_sep: '='
+        item_sep: ','
+        exclude_keys: []
+  runtime:
+    version: ???
+    version_base: ???
+    cwd: ???
+    config_sources: ???
+    output_dir: ???
+    choices: {}
+  verbose: false