Upload folder using huggingface_hub

Browse files

Files changed (4) hide show

InternVLPI05-0302-eep_2222_127000/checkpoints/steps_127000_pytorch_model.pt +3 -0
InternVLPI05-0302-eep_2222_127000/config.json +104 -0
InternVLPI05-0302-eep_2222_127000/config.yaml +67 -0
InternVLPI05-0302-eep_2222_127000/dataset_statistics.json +218 -0

InternVLPI05-0302-eep_2222_127000/checkpoints/steps_127000_pytorch_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:89285d55289afa919301590c28d52db23a6e38fc7594fb687af2d033b8bf2760
+size 2853231794

InternVLPI05-0302-eep_2222_127000/config.json ADDED Viewed

	@@ -0,0 +1,104 @@

+{
+  "run_id": "InternVLPI05-0302-eep_2222",
+  "run_root_dir": "/lumos-vePFS/shenzhen/models/lumos_pi",
+  "seed": 42,
+  "trackers": [
+    "jsonl"
+  ],
+  "wandb_entity": null,
+  "wandb_project": null,
+  "is_debug": false,
+  "framework": {
+    "name": "internvlPI_adaRMS",
+    "qwenvl": {
+      "base_vlm": "/lumos-vePFS/shenzhen/models/InternVL3_5-1B-Instruct",
+      "attn_implementation": "eager",
+      "vl_hidden_dim": 2048
+    },
+    "action_model": {
+      "add_pos_embed": true,
+      "hidden_size": 1024,
+      "max_seq_len": 1024,
+      "action_model_type": "DiT-B",
+      "action_dim": 20,
+      "state_dim": 20,
+      "future_action_window_size": 15,
+      "past_action_window_size": 0,
+      "action_horizon": 30,
+      "repeated_diffusion_steps": 2,
+      "noise_beta_alpha": 1.5,
+      "noise_beta_beta": 1.0,
+      "noise_s": 0.999,
+      "num_timestep_buckets": 1000,
+      "num_inference_timesteps": 8,
+      "num_target_vision_tokens": 32,
+      "use_scaled_noise": true,
+      "diffusion_model_cfg": {
+        "dropout": 0.2,
+        "final_dropout": true,
+        "interleave_self_attention": true,
+        "norm_type": "ada_rms",
+        "num_layers": 28,
+        "output_dim": 2560,
+        "positional_embeddings": null
+      },
+      "smoothness_loss_weight": 1,
+      "use_kv_cache_dit": true
+    }
+  },
+  "datasets": {
+    "vla_data": {
+      "dataset_py": "lerobot_datasets",
+      "data_root_dir": "/lumos-vePFS/shenzhen/data/data_warehouse/data_warehouse_output_clean",
+      "data_mix": "train_QwenPI",
+      "per_device_batch_size": 16,
+      "num_workers": 2,
+      "action_type": "abs_ee",
+      "image_size": 256,
+      "video_backend": "pyav"
+    }
+  },
+  "trainer": {
+    "epochs": 100,
+    "max_train_steps": 200000,
+    "num_warmup_steps": 5000,
+    "save_interval": 1000,
+    "eval_interval": 10000000,
+    "learning_rate": {
+      "base": 1e-05,
+      "intern_vl_interface": 1e-05,
+      "action_model": 0.0001
+    },
+    "lr_scheduler_type": "cosine_with_min_lr",
+    "scheduler_specific_kwargs": {
+      "min_lr": 1e-06
+    },
+    "freeze_modules": null,
+    "loss_scale": {
+      "vla": 1.0,
+      "vlm": 0.05
+    },
+    "max_grad_norm": 1.0,
+    "warmup_ratio": 0.1,
+    "weight_decay": 0.0,
+    "logging_frequency": 10,
+    "gradient_clipping": 1.0,
+    "gradient_accumulation_steps": 2,
+    "optimizer": {
+      "name": "AdamW",
+      "betas": [
+        0.9,
+        0.95
+      ],
+      "eps": 1e-08,
+      "weight_decay": 0
+    }
+  },
+  "is_resume": true,
+  "resume_epoch": null,
+  "resume_step": 5000,
+  "enable_gradient_checkpointing": true,
+  "enable_mixed_precision_training": true,
+  "report_to": "jsonl",
+  "output_dir": "/lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI05-0302-eep_2222"
+}

InternVLPI05-0302-eep_2222_127000/config.yaml ADDED Viewed

	@@ -0,0 +1,67 @@

+datasets:
+  vla_data:
+    data_mix: train_QwenPI
+    data_root_dir: /lumos-vePFS/shenzhen/data/data_warehouse/data_warehouse_output_clean
+    dataset_py: lerobot_datasets
+    image_size: 256
+    num_workers: 2
+    per_device_batch_size: 16
+framework:
+  action_model:
+    action_dim: 20
+    add_pos_embed: true
+    diffusion_model_cfg:
+      cross_attention_dim: 1024
+      dropout: 0.2
+      final_dropout: true
+      interleave_self_attention: true
+      norm_elementwise_affine: false
+      norm_type: ada_rms
+      num_layers: 28
+      output_dim: 2560
+      positional_embeddings: null
+    future_action_window_size: 15
+    hidden_dim: 1024
+    max_seq_len: 1024
+    noise_beta_alpha: 1.5
+    noise_beta_beta: 1.0
+    noise_s: 0.999
+    num_inference_timesteps: 8
+    num_target_vision_tokens: 32
+    num_timestep_buckets: 1000
+    past_action_window_size: 0
+    smoothness_loss_weight: 1
+    state_dim: 20
+    use_kv_cache_dit: true
+    use_scaled_noise: true
+  name: internvlPI_adaRMS
+  qwenvl:
+    attn_implementation: eager
+    base_vlm: /lumos-vePFS/shenzhen/models/InternVL3_5-1B-Instruct
+    num_vl_layers: 28
+    vl_hidden_dim: 1024
+output_dir: /lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI05-0302-eep_2222
+run_id: InternVLPI05-0302-eep_2222
+run_root_dir: /lumos-vePFS/shenzhen/models/lumos_pi
+seed: 42
+trainer:
+  freeze_modules: null
+  gradient_accumulation_steps: 2
+  gradient_clipping: 1.0
+  learning_rate:
+    action_model: 0.0001
+    base: 1.0e-05
+    intern_vl_interface: 1.0e-05
+  logging_frequency: 10
+  lr_scheduler_type: cosine_with_min_lr
+  max_train_steps: 200000
+  num_warmup_steps: 5000
+  optimizer:
+    betas:
+    - 0.9
+    - 0.95
+    eps: 1.0e-08
+    weight_decay: 0
+  save_interval: 1000
+  scheduler_specific_kwargs:
+    min_lr: 1.0e-06

InternVLPI05-0302-eep_2222_127000/dataset_statistics.json ADDED Viewed

	@@ -0,0 +1,218 @@

+{
+  "new_embodiment": {
+    "action": {
+      "mean": [
+        0.2627080635678384,
+        -0.06905352499339759,
+        0.19377399452271005,
+        -1.1311389931267308,
+        0.4074968476929972,
+        1.5050847338091942,
+        0.03278727958639783,
+        0.2358027420216991,
+        0.08325479407944988,
+        0.209077634157673,
+        1.521457871722598,
+        0.5131264127069904,
+        -1.5608658809815683,
+        0.03465066600831285
+      ],
+      "std": [
+        0.10375088171089163,
+        0.10887929577588172,
+        0.06680644047420393,
+        2.68255043659873,
+        0.3260696396232237,
+        2.3507239802774746,
+        0.028485141733389688,
+        0.09299172799800302,
+        0.081275375183015,
+        0.05484981855789096,
+        2.487506748874059,
+        0.2941890671188146,
+        2.3367093690706113,
+        0.02833451591418635
+      ],
+      "max": [
+        0.5931400060653687,
+        0.48442599177360535,
+        0.6720470190048218,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.0810599997639656,
+        0.5695070028305054,
+        0.4637550115585327,
+        0.6456500291824341,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.0611100010573864
+      ],
+      "min": [
+        -0.10788500308990479,
+        -0.5191159844398499,
+        0.040369000285863876,
+        -3.1410515308380127,
+        -1.0231120586395264,
+        -3.1410515308380127,
+        -0.0017500000540167093,
+        -0.03119499981403351,
+        -0.3384290039539337,
+        0.07246199995279312,
+        -3.1410515308380127,
+        -0.7706850171089172,
+        -3.1410515308380127,
+        0.0
+      ],
+      "q01": [
+        0.03489213060587645,
+        -0.36912800788879396,
+        0.07184209674596786,
+        -3.137246325016022,
+        -0.20070483744144438,
+        -3.137392144203186,
+        0.0,
+        0.030881709717214108,
+        -0.15914200246334076,
+        0.10170399993658066,
+        -3.138171911239624,
+        -0.11282174646854401,
+        -3.1362587141990663,
+        7.000000186963007e-05
+      ],
+      "q99": [
+        0.5304324626922607,
+        0.41213971734046934,
+        0.44856594711542136,
+        3.1415927410125732,
+        1.5365502309799193,
+        3.1415927410125732,
+        0.06019999831914902,
+        0.5246558457612991,
+        0.3517844846844672,
+        0.4130769228935239,
+        3.1415927410125732,
+        1.5435859155654907,
+        3.1415927410125732,
+        0.05992000177502632
+      ],
+      "mask": [
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false
+      ]
+    },
+    "state": {
+      "mean": [
+        0.2627080635678384,
+        -0.06905352499339759,
+        0.19377399452271005,
+        -1.1311389931267308,
+        0.4074968476929972,
+        1.5050847338091942,
+        0.03278727958639783,
+        0.2358027420216991,
+        0.08325479407944988,
+        0.209077634157673,
+        1.521457871722598,
+        0.5131264127069904,
+        -1.5608658809815683,
+        0.03465066600831285
+      ],
+      "std": [
+        0.10375088171089163,
+        0.10887929577588172,
+        0.06680644047420393,
+        2.68255043659873,
+        0.3260696396232237,
+        2.3507239802774746,
+        0.028485141733389688,
+        0.09299172799800302,
+        0.081275375183015,
+        0.05484981855789096,
+        2.487506748874059,
+        0.2941890671188146,
+        2.3367093690706113,
+        0.02833451591418635
+      ],
+      "max": [
+        0.5931400060653687,
+        0.48442599177360535,
+        0.6720470190048218,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.0810599997639656,
+        0.5695070028305054,
+        0.4637550115585327,
+        0.6456500291824341,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.0611100010573864
+      ],
+      "min": [
+        -0.10788500308990479,
+        -0.5191159844398499,
+        0.040369000285863876,
+        -3.1410515308380127,
+        -1.0231120586395264,
+        -3.1410515308380127,
+        -0.0017500000540167093,
+        -0.03119499981403351,
+        -0.3384290039539337,
+        0.07246199995279312,
+        -3.1410515308380127,
+        -0.7706850171089172,
+        -3.1410515308380127,
+        0.0
+      ],
+      "q01": [
+        0.03489213060587645,
+        -0.36912800788879396,
+        0.07184209674596786,
+        -3.137246325016022,
+        -0.20070483744144438,
+        -3.137392144203186,
+        0.0,
+        0.030881709717214108,
+        -0.15914200246334076,
+        0.10170399993658066,
+        -3.138171911239624,
+        -0.11282174646854401,
+        -3.1362587141990663,
+        7.000000186963007e-05
+      ],
+      "q99": [
+        0.5304324626922607,
+        0.41213971734046934,
+        0.44856594711542136,
+        3.1415927410125732,
+        1.5365502309799193,
+        3.1415927410125732,
+        0.06019999831914902,
+        0.5246558457612991,
+        0.3517844846844672,
+        0.4130769228935239,
+        3.1415927410125732,
+        1.5435859155654907,
+        3.1415927410125732,
+        0.05992000177502632
+      ]
+    },
+    "num_transitions": 2587963,
+    "num_trajectories": 1976
+  }
+}