Upload folder using huggingface_hub

Browse files

Files changed (4) hide show

InternVLPI-0302-eep-pretrain_T2_sft_23000/checkpoints/steps_23000_pytorch_model.pt +3 -0
InternVLPI-0302-eep-pretrain_T2_sft_23000/config.json +107 -0
InternVLPI-0302-eep-pretrain_T2_sft_23000/config.yaml +68 -0
InternVLPI-0302-eep-pretrain_T2_sft_23000/dataset_statistics.json +218 -0

InternVLPI-0302-eep-pretrain_T2_sft_23000/checkpoints/steps_23000_pytorch_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8d9bac614da20ddb00d404628a2c2ece9368a01e27804905f9ae1c4b9538494
+size 2966606180

InternVLPI-0302-eep-pretrain_T2_sft_23000/config.json ADDED Viewed

	@@ -0,0 +1,107 @@

+{
+  "run_id": "InternVLPI-0302-eep-pretrain_T2_sft",
+  "run_root_dir": "/lumos-vePFS/shenzhen/models/lumos_pi",
+  "seed": 42,
+  "trackers": [
+    "jsonl"
+  ],
+  "wandb_entity": null,
+  "wandb_project": null,
+  "is_debug": false,
+  "framework": {
+    "name": "internvlPI",
+    "qwenvl": {
+      "base_vlm": "/lumos-vePFS/shenzhen/models/InternVL3_5-1B-Instruct",
+      "attn_implementation": "eager",
+      "vl_hidden_dim": 2048
+    },
+    "action_model": {
+      "add_pos_embed": true,
+      "hidden_size": 1024,
+      "max_seq_len": 1024,
+      "action_model_type": "DiT-B",
+      "action_dim": 20,
+      "state_dim": 20,
+      "future_action_window_size": 15,
+      "past_action_window_size": 0,
+      "action_horizon": 30,
+      "repeated_diffusion_steps": 2,
+      "noise_beta_alpha": 1.5,
+      "noise_beta_beta": 1.0,
+      "noise_s": 0.999,
+      "num_timestep_buckets": 1000,
+      "num_inference_timesteps": 8,
+      "num_target_vision_tokens": 32,
+      "use_scaled_noise": true,
+      "use_kv_cache_dit": true,
+      "diffusion_model_cfg": {
+        "dropout": 0.2,
+        "final_dropout": true,
+        "interleave_self_attention": true,
+        "norm_type": "ada_norm",
+        "num_layers": 28,
+        "output_dim": 2560,
+        "positional_embeddings": null
+      },
+      "smoothness_loss_weight": 1
+    }
+  },
+  "datasets": {
+    "vla_data": {
+      "dataset_py": "lerobot_datasets",
+      "data_root_dir": "/lumos-vePFS/shenzhen/data/data_warehouse/data_warehouse_output_clean",
+      "data_mix": "train_QwenPI",
+      "per_device_batch_size": 16,
+      "num_workers": 4,
+      "action_type": "abs_ee",
+      "image_size": 256,
+      "video_backend": "pyav"
+    }
+  },
+  "trainer": {
+    "epochs": 100,
+    "max_train_steps": 200000,
+    "num_warmup_steps": 5000,
+    "save_interval": 1000,
+    "eval_interval": 10000000,
+    "learning_rate": {
+      "base": 1e-05,
+      "intern_vl_interface": 1e-05,
+      "action_model": 0.0001
+    },
+    "lr_scheduler_type": "cosine_with_min_lr",
+    "scheduler_specific_kwargs": {
+      "min_lr": 1e-06
+    },
+    "freeze_modules": null,
+    "loss_scale": {
+      "vla": 1.0,
+      "vlm": 0.05
+    },
+    "max_grad_norm": 1.0,
+    "warmup_ratio": 0.1,
+    "weight_decay": 0.0,
+    "logging_frequency": 10,
+    "gradient_clipping": 1.0,
+    "gradient_accumulation_steps": 3,
+    "optimizer": {
+      "name": "AdamW",
+      "betas": [
+        0.9,
+        0.95
+      ],
+      "eps": 1e-08,
+      "weight_decay": 0
+    },
+    "pretrained_checkpoint": "/lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI-0225-eep-pretrain_T2/checkpoints/steps_23000_pytorch_model.pt",
+    "is_resume": true,
+    "resume_step": 11000
+  },
+  "is_resume": true,
+  "resume_epoch": null,
+  "resume_step": 5000,
+  "enable_gradient_checkpointing": true,
+  "enable_mixed_precision_training": true,
+  "report_to": "jsonl",
+  "output_dir": "/lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI-0302-eep-pretrain_T2_sft"
+}

InternVLPI-0302-eep-pretrain_T2_sft_23000/config.yaml ADDED Viewed

	@@ -0,0 +1,68 @@

+datasets:
+  vla_data:
+    data_mix: train_QwenPI
+    data_root_dir: /lumos-vePFS/shenzhen/data/data_warehouse/data_warehouse_output_clean
+    dataset_py: lerobot_datasets
+    image_size: 256
+    num_workers: 4
+    per_device_batch_size: 16
+framework:
+  action_model:
+    action_dim: 20
+    add_pos_embed: true
+    diffusion_model_cfg:
+      dropout: 0.2
+      final_dropout: true
+      interleave_self_attention: true
+      norm_type: ada_norm
+      num_layers: 28
+      output_dim: 2560
+      positional_embeddings: null
+    future_action_window_size: 15
+    hidden_dim: 1024
+    max_seq_len: 1024
+    noise_beta_alpha: 1.5
+    noise_beta_beta: 1.0
+    noise_s: 0.999
+    num_inference_timesteps: 8
+    num_target_vision_tokens: 32
+    num_timestep_buckets: 1000
+    past_action_window_size: 0
+    smoothness_loss_weight: 1
+    state_dim: 20
+    use_kv_cache_dit: true
+    use_scaled_noise: true
+  name: internvlPI
+  qwenvl:
+    attn_implementation: eager
+    base_vlm: /lumos-vePFS/shenzhen/models/InternVL3_5-1B-Instruct
+    num_vl_layers: 28
+    vl_hidden_dim: 1024
+output_dir: /lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI-0302-eep-pretrain_T2_sft
+run_id: InternVLPI-0302-eep-pretrain_T2_sft
+run_root_dir: /lumos-vePFS/shenzhen/models/lumos_pi
+seed: 42
+trainer:
+  eval_interval: 10000000
+  freeze_modules: null
+  gradient_accumulation_steps: 3
+  gradient_clipping: 1.0
+  is_resume: true
+  learning_rate:
+    action_model: 0.0001
+    base: 1.0e-05
+    intern_vl_interface: 1.0e-05
+  logging_frequency: 10
+  lr_scheduler_type: cosine_with_min_lr
+  max_train_steps: 200000
+  num_warmup_steps: 5000
+  optimizer:
+    betas:
+    - 0.9
+    - 0.95
+    eps: 1.0e-08
+    weight_decay: 0
+  pretrained_checkpoint: /lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI-0225-eep-pretrain_T2/checkpoints/steps_23000_pytorch_model.pt
+  save_interval: 1000
+  scheduler_specific_kwargs:
+    min_lr: 1.0e-06

InternVLPI-0302-eep-pretrain_T2_sft_23000/dataset_statistics.json ADDED Viewed

	@@ -0,0 +1,218 @@

+{
+  "new_embodiment": {
+    "action": {
+      "mean": [
+        0.2675580734556372,
+        -0.06659615870739799,
+        0.19635865566405383,
+        -1.313161190599203,
+        0.41478794440627087,
+        1.4886140796271237,
+        0.0327876329168,
+        0.2434083236889406,
+        0.09594157693738284,
+        0.20976496081460608,
+        1.4955806767737323,
+        0.5106299925934186,
+        -1.5047886750914834,
+        0.035419227597727025
+      ],
+      "std": [
+        0.10220121447453302,
+        0.11127593499077473,
+        0.0693507274854023,
+        2.61021122878121,
+        0.31264831774938195,
+        2.385310375748136,
+        0.028368956930127334,
+        0.09613372647295047,
+        0.08261520968608296,
+        0.05838800456095643,
+        2.516367436105295,
+        0.2863539402986677,
+        2.4039184089857386,
+        0.028089917285829002
+      ],
+      "max": [
+        0.5965149998664856,
+        0.48442599177360535,
+        0.6967939734458923,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.0810599997639656,
+        0.5695070028305054,
+        0.4637550115585327,
+        0.6456500291824341,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.061319999396800995
+      ],
+      "min": [
+        -0.10788500308990479,
+        -0.5191159844398499,
+        0.040369000285863876,
+        -3.1410515308380127,
+        -1.5302174091339111,
+        -3.1410515308380127,
+        -0.0017500000540167093,
+        -0.03119499981403351,
+        -0.356126993894577,
+        0.06903599947690964,
+        -3.141069173812866,
+        -0.7706850171089172,
+        -3.1410515308380127,
+        0.0
+      ],
+      "q01": [
+        0.03489213060587645,
+        -0.36912800788879396,
+        0.07184209674596786,
+        -3.137246325016022,
+        -0.20070483744144438,
+        -3.137392144203186,
+        0.0,
+        0.030881709717214108,
+        -0.15914200246334076,
+        0.10170399993658066,
+        -3.138237874507904,
+        -0.11282174646854401,
+        -3.1362587141990663,
+        7.000000186963007e-05
+      ],
+      "q99": [
+        0.5328979176282882,
+        0.41213971734046934,
+        0.47792605459690085,
+        3.1415927410125732,
+        1.5365502309799193,
+        3.1415927410125732,
+        0.06019999831914902,
+        0.5246558457612991,
+        0.35473266333341585,
+        0.42531779676675785,
+        3.1415927410125732,
+        1.5435859155654907,
+        3.1415927410125732,
+        0.05992000177502632
+      ],
+      "mask": [
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false
+      ]
+    },
+    "state": {
+      "mean": [
+        0.2675580734556372,
+        -0.06659615870739799,
+        0.19635865566405383,
+        -1.313161190599203,
+        0.41478794440627087,
+        1.4886140796271237,
+        0.0327876329168,
+        0.2434083236889406,
+        0.09594157693738284,
+        0.20976496081460608,
+        1.4955806767737323,
+        0.5106299925934186,
+        -1.5047886750914834,
+        0.035419227597727025
+      ],
+      "std": [
+        0.10220121447453302,
+        0.11127593499077473,
+        0.0693507274854023,
+        2.61021122878121,
+        0.31264831774938195,
+        2.385310375748136,
+        0.028368956930127334,
+        0.09613372647295047,
+        0.08261520968608296,
+        0.05838800456095643,
+        2.516367436105295,
+        0.2863539402986677,
+        2.4039184089857386,
+        0.028089917285829002
+      ],
+      "max": [
+        0.5965149998664856,
+        0.48442599177360535,
+        0.6967939734458923,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.0810599997639656,
+        0.5695070028305054,
+        0.4637550115585327,
+        0.6456500291824341,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.061319999396800995
+      ],
+      "min": [
+        -0.10788500308990479,
+        -0.5191159844398499,
+        0.040369000285863876,
+        -3.1410515308380127,
+        -1.5302174091339111,
+        -3.1410515308380127,
+        -0.0017500000540167093,
+        -0.03119499981403351,
+        -0.356126993894577,
+        0.06903599947690964,
+        -3.141069173812866,
+        -0.7706850171089172,
+        -3.1410515308380127,
+        0.0
+      ],
+      "q01": [
+        0.03489213060587645,
+        -0.36912800788879396,
+        0.07184209674596786,
+        -3.137246325016022,
+        -0.20070483744144438,
+        -3.137392144203186,
+        0.0,
+        0.030881709717214108,
+        -0.15914200246334076,
+        0.10170399993658066,
+        -3.138237874507904,
+        -0.11282174646854401,
+        -3.1362587141990663,
+        7.000000186963007e-05
+      ],
+      "q99": [
+        0.5328979176282882,
+        0.41213971734046934,
+        0.47792605459690085,
+        3.1415927410125732,
+        1.5365502309799193,
+        3.1415927410125732,
+        0.06019999831914902,
+        0.5246558457612991,
+        0.35473266333341585,
+        0.42531779676675785,
+        3.1415927410125732,
+        1.5435859155654907,
+        3.1415927410125732,
+        0.05992000177502632
+      ]
+    },
+    "num_transitions": 3335583,
+    "num_trajectories": 2411
+  }
+}