Upload folder using huggingface_hub

Browse files

Files changed (3) hide show

internpi-0127-eep-small/config.json +106 -0
internpi-0127-eep-small/config.yaml +67 -0
internpi-0127-eep-small/dataset_statistics.json +218 -0

internpi-0127-eep-small/config.json ADDED Viewed

	@@ -0,0 +1,106 @@

+{
+  "run_id": "InternVLPI-0127-eep-test",
+  "run_root_dir": "/lumos-vePFS/shenzhen/models/lumos_pi",
+  "seed": 42,
+  "trackers": [
+    "jsonl"
+  ],
+  "wandb_entity": null,
+  "wandb_project": null,
+  "is_debug": false,
+  "framework": {
+    "name": "internvlPI",
+    "qwenvl": {
+      "base_vlm": "/lumos-vePFS/shenzhen/models/InternVL3_5-1B-Instruct",
+      "attn_implementation": "eager",
+      "vl_hidden_dim": 2048
+    },
+    "action_model": {
+      "add_pos_embed": true,
+      "hidden_size": 1024,
+      "max_seq_len": 1024,
+      "action_model_type": "DiT-B",
+      "action_dim": 20,
+      "state_dim": 20,
+      "future_action_window_size": 15,
+      "past_action_window_size": 0,
+      "action_horizon": 30,
+      "repeated_diffusion_steps": 2,
+      "noise_beta_alpha": 1.5,
+      "noise_beta_beta": 1.0,
+      "noise_s": 0.999,
+      "num_timestep_buckets": 1000,
+      "num_inference_timesteps": 8,
+      "num_target_vision_tokens": 32,
+      "use_scaled_noise": true,
+      "diffusion_model_cfg": {
+        "dropout": 0.2,
+        "final_dropout": true,
+        "interleave_self_attention": true,
+        "norm_type": "ada_norm",
+        "num_layers": 28,
+        "output_dim": 2560,
+        "positional_embeddings": null
+      },
+      "smoothness_loss_weight": 1
+    }
+  },
+  "datasets": {
+    "vla_data": {
+      "dataset_py": "lerobot_datasets",
+      "data_root_dir": "/lumos-vePFS/shenzhen/data/data_warehouse/data_warehouse_output",
+      "data_mix": "train_QwenPI",
+      "per_device_batch_size": 4,
+      "num_workers": 2,
+      "action_type": "abs_ee",
+      "image_size": [
+        480,
+        360
+      ],
+      "video_backend": "pyav"
+    }
+  },
+  "trainer": {
+    "epochs": 100,
+    "max_train_steps": 35000,
+    "num_warmup_steps": 5000,
+    "save_interval": 1000,
+    "eval_interval": 100000,
+    "learning_rate": {
+      "base": 1e-05,
+      "intern_vl_interface": 1e-05,
+      "action_model": 0.0001
+    },
+    "lr_scheduler_type": "cosine_with_min_lr",
+    "scheduler_specific_kwargs": {
+      "min_lr": 1e-06
+    },
+    "freeze_modules": null,
+    "loss_scale": {
+      "vla": 1.0,
+      "vlm": 0.05
+    },
+    "max_grad_norm": 1.0,
+    "warmup_ratio": 0.1,
+    "weight_decay": 0.0,
+    "logging_frequency": 10,
+    "gradient_clipping": 1.0,
+    "gradient_accumulation_steps": 2,
+    "optimizer": {
+      "name": "AdamW",
+      "betas": [
+        0.9,
+        0.95
+      ],
+      "eps": 1e-08,
+      "weight_decay": 0
+    }
+  },
+  "is_resume": true,
+  "resume_epoch": null,
+  "resume_step": 5000,
+  "enable_gradient_checkpointing": true,
+  "enable_mixed_precision_training": true,
+  "report_to": "jsonl",
+  "output_dir": "/lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI-0127-eep-test"
+}

internpi-0127-eep-small/config.yaml ADDED Viewed

	@@ -0,0 +1,67 @@

+datasets:
+  vla_data:
+    data_mix: train_QwenPI
+    data_root_dir: /lumos-vePFS/shenzhen/data/data_warehouse/data_warehouse_output
+    dataset_py: lerobot_datasets
+    image_size:
+    - 480
+    - 360
+    per_device_batch_size: 4
+    video_backend: pyav
+framework:
+  action_model:
+    action_dim: 20
+    add_pos_embed: true
+    diffusion_model_cfg:
+      dropout: 0.2
+      final_dropout: true
+      interleave_self_attention: true
+      norm_type: ada_norm
+      num_layers: 28
+      output_dim: 2560
+      positional_embeddings: null
+    future_action_window_size: 15
+    hidden_dim: 1024
+    max_seq_len: 1024
+    noise_beta_alpha: 1.5
+    noise_beta_beta: 1.0
+    noise_s: 0.999
+    num_inference_timesteps: 8
+    num_target_vision_tokens: 32
+    num_timestep_buckets: 1000
+    past_action_window_size: 0
+    smoothness_loss_weight: 1
+    state_dim: 20
+    use_scaled_noise: true
+  name: internvlPI
+  qwenvl:
+    attn_implementation: eager
+    base_vlm: /lumos-vePFS/shenzhen/models/InternVL3_5-1B-Instruct
+    num_vl_layers: 28
+    vl_hidden_dim: 1024
+output_dir: /lumos-vePFS/shenzhen/models/lumos_pi/InternVLPI-0127-eep-test
+run_id: InternVLPI-0127-eep-test
+run_root_dir: /lumos-vePFS/shenzhen/models/lumos_pi
+seed: 42
+trainer:
+  eval_interval: 100000
+  freeze_modules: null
+  gradient_accumulation_steps: 2
+  gradient_clipping: 1.0
+  learning_rate:
+    action_model: 0.0001
+    base: 1.0e-05
+    intern_vl_interface: 1.0e-05
+  logging_frequency: 10
+  lr_scheduler_type: cosine_with_min_lr
+  max_train_steps: 35000
+  num_warmup_steps: 5000
+  optimizer:
+    betas:
+    - 0.9
+    - 0.95
+    eps: 1.0e-08
+    weight_decay: 0
+  save_interval: 1000
+  scheduler_specific_kwargs:
+    min_lr: 1.0e-06

internpi-0127-eep-small/dataset_statistics.json ADDED Viewed

	@@ -0,0 +1,218 @@

+{
+  "new_embodiment": {
+    "action": {
+      "mean": [
+        0.24831613898277283,
+        0.027144895866513252,
+        0.22650116682052612,
+        -0.8404249548912048,
+        0.5109900832176208,
+        0.3438127040863037,
+        0.05076254904270172,
+        0.27124547958374023,
+        0.1341637223958969,
+        0.23118293285369873,
+        0.5084952116012573,
+        0.7631425261497498,
+        -1.8881397247314453,
+        0.04549280181527138
+      ],
+      "std": [
+        0.08048900961875916,
+        0.11851683259010315,
+        0.05085735768079758,
+        2.8058412075042725,
+        0.3912830650806427,
+        2.907383441925049,
+        0.02002296969294548,
+        0.10783883184194565,
+        0.09286945313215256,
+        0.05440365895628929,
+        2.881397008895874,
+        0.2646803855895996,
+        1.884290337562561,
+        0.023190317675471306
+      ],
+      "max": [
+        0.4355350136756897,
+        0.42503198981285095,
+        0.4411650002002716,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.059709999710321426,
+        0.528249979019165,
+        0.4351179897785187,
+        0.4433180093765259,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.05992000177502632
+      ],
+      "min": [
+        0.042451001703739166,
+        -0.21000799536705017,
+        0.11678700149059296,
+        -3.1410341262817383,
+        -0.282882958650589,
+        -3.141016721725464,
+        0.0005600000149570405,
+        0.0038419999182224274,
+        -0.10948000103235245,
+        0.09222699701786041,
+        -3.1410515308380127,
+        0.1244419738650322,
+        -3.1410515308380127,
+        7.000000186963007e-05
+      ],
+      "q01": [
+        0.05619199946522713,
+        -0.17355053395032882,
+        0.13174245327711107,
+        -3.133350660800934,
+        -0.1359262466430664,
+        -3.1331721353530884,
+        0.000699999975040555,
+        0.05602800101041794,
+        -0.03544915910810232,
+        0.11746856845915318,
+        -3.1342583203315737,
+        0.2646872201561928,
+        -3.1262485551834107,
+        0.0002800000074785203
+      ],
+      "q99": [
+        0.3960674390196795,
+        0.35788134992122633,
+        0.3558399733901022,
+        3.1415927410125732,
+        1.5315977966785421,
+        3.1415927410125732,
+        0.05964000150561333,
+        0.48414370894432057,
+        0.3517844846844672,
+        0.36821531414985653,
+        3.1415927410125732,
+        1.5277097356319418,
+        3.1415927410125732,
+        0.05992000177502632
+      ],
+      "mask": [
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false,
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false
+      ]
+    },
+    "state": {
+      "mean": [
+        0.24831613898277283,
+        0.027144895866513252,
+        0.22650116682052612,
+        -0.8404249548912048,
+        0.5109900832176208,
+        0.3438127040863037,
+        0.05076254904270172,
+        0.27124547958374023,
+        0.1341637223958969,
+        0.23118293285369873,
+        0.5084952116012573,
+        0.7631425261497498,
+        -1.8881397247314453,
+        0.04549280181527138
+      ],
+      "std": [
+        0.08048900961875916,
+        0.11851683259010315,
+        0.05085735768079758,
+        2.8058412075042725,
+        0.3912830650806427,
+        2.907383441925049,
+        0.02002296969294548,
+        0.10783883184194565,
+        0.09286945313215256,
+        0.05440365895628929,
+        2.881397008895874,
+        0.2646803855895996,
+        1.884290337562561,
+        0.023190317675471306
+      ],
+      "max": [
+        0.4355350136756897,
+        0.42503198981285095,
+        0.4411650002002716,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.059709999710321426,
+        0.528249979019165,
+        0.4351179897785187,
+        0.4433180093765259,
+        3.1415927410125732,
+        1.5707963705062866,
+        3.1415927410125732,
+        0.05992000177502632
+      ],
+      "min": [
+        0.042451001703739166,
+        -0.21000799536705017,
+        0.11678700149059296,
+        -3.1410341262817383,
+        -0.282882958650589,
+        -3.141016721725464,
+        0.0005600000149570405,
+        0.0038419999182224274,
+        -0.10948000103235245,
+        0.09222699701786041,
+        -3.1410515308380127,
+        0.1244419738650322,
+        -3.1410515308380127,
+        7.000000186963007e-05
+      ],
+      "q01": [
+        0.05619199946522713,
+        -0.17355053395032882,
+        0.13174245327711107,
+        -3.133350660800934,
+        -0.1359262466430664,
+        -3.1331721353530884,
+        0.000699999975040555,
+        0.05602800101041794,
+        -0.03544915910810232,
+        0.11746856845915318,
+        -3.1342583203315737,
+        0.2646872201561928,
+        -3.1262485551834107,
+        0.0002800000074785203
+      ],
+      "q99": [
+        0.3960674390196795,
+        0.35788134992122633,
+        0.3558399733901022,
+        3.1415927410125732,
+        1.5315977966785421,
+        3.1415927410125732,
+        0.05964000150561333,
+        0.48414370894432057,
+        0.3517844846844672,
+        0.36821531414985653,
+        3.1415927410125732,
+        1.5277097356319418,
+        3.1415927410125732,
+        0.05992000177502632
+      ]
+    },
+    "num_transitions": 34124,
+    "num_trajectories": 52
+  }
+}