initial commit

Browse files

Files changed (4) hide show

checkpoints/step-080000-epoch-09-loss=0.0408.pt +3 -0
config.json +32 -0
config.yaml +29 -0
dataset_statistics.json +127 -0

checkpoints/step-080000-epoch-09-loss=0.0408.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c0e3a4f007e31fdc849cbf730f709c5358ffa5fa45ff324c299afd144c5a1de
+size 30165309772

config.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+  "train_reasoner": true,
+  "use_fast_tokenizer": false,
+  "vla": {
+    "action_tokenizer": "action_tokenizer",
+    "base_vlm": "prism-dinosiglip-224px+7b",
+    "data_mix": "bridge",
+    "enable_gradient_checkpointing": true,
+    "enable_mixed_precision_training": true,
+    "epochs": 1000,
+    "expected_world_size": 8,
+    "freeze_llm_backbone": false,
+    "freeze_vision_backbone": false,
+    "global_batch_size": 256,
+    "image_sequence_len": 1,
+    "learning_rate": 2e-05,
+    "lr_scheduler_type": "constant",
+    "max_grad_norm": 1.0,
+    "max_steps": null,
+    "per_device_batch_size": 32,
+    "reduce_in_full_precision": true,
+    "save_every_n_steps": 25000,
+    "shuffle_buffer_size": 256000,
+    "train_strategy": "fsdp-full-shard",
+    "type": "prism-dinosiglip-224px+mx-bridge",
+    "unfreeze_last_llm_layer": false,
+    "use_wrist_image": false,
+    "vla_id": "prism-dinosiglip-224px+mx-bridge",
+    "warmup_ratio": 0.0,
+    "weight_decay": 0.0
+  }
+}

config.yaml ADDED Viewed

	@@ -0,0 +1,29 @@

+train_reasoner: true
+use_fast_tokenizer: false
+vla:
+  action_tokenizer: action_tokenizer
+  base_vlm: prism-dinosiglip-224px+7b
+  data_mix: bridge
+  enable_gradient_checkpointing: true
+  enable_mixed_precision_training: true
+  epochs: 1000
+  expected_world_size: 8
+  freeze_llm_backbone: false
+  freeze_vision_backbone: false
+  global_batch_size: 256
+  image_sequence_len: 1
+  learning_rate: 2.0e-05
+  lr_scheduler_type: constant
+  max_grad_norm: 1.0
+  max_steps: null
+  per_device_batch_size: 32
+  reduce_in_full_precision: true
+  save_every_n_steps: 25000
+  shuffle_buffer_size: 256000
+  train_strategy: fsdp-full-shard
+  type: prism-dinosiglip-224px+mx-bridge
+  unfreeze_last_llm_layer: false
+  use_wrist_image: false
+  vla_id: prism-dinosiglip-224px+mx-bridge
+  warmup_ratio: 0.0
+  weight_decay: 0.0

dataset_statistics.json ADDED Viewed

	@@ -0,0 +1,127 @@

+{
+  "bridge_orig": {
+    "action": {
+      "mean": [
+        0.00023341993801295757,
+        0.00013004825450479984,
+        -0.00012762498226948082,
+        -0.00015565630747005343,
+        -0.0004039340128656477,
+        0.00023557698295917362,
+        0.5764579772949219
+      ],
+      "std": [
+        0.00976591743528843,
+        0.013689151965081692,
+        0.012667378410696983,
+        0.028534315526485443,
+        0.030638020485639572,
+        0.07691382616758347,
+        0.49737095832824707
+      ],
+      "max": [
+        0.41691166162490845,
+        0.25864794850349426,
+        0.21218234300613403,
+        3.122201919555664,
+        1.8618112802505493,
+        6.280478477478027,
+        1.0
+      ],
+      "min": [
+        -0.4007510244846344,
+        -0.13874775171279907,
+        -0.22553899884223938,
+        -3.2010786533355713,
+        -1.8618112802505493,
+        -6.279075622558594,
+        0.0
+      ],
+      "q01": [
+        -0.02872725307941437,
+        -0.04170349963009357,
+        -0.026093858778476715,
+        -0.08092105075716972,
+        -0.09288699507713317,
+        -0.20718276381492615,
+        0.0
+      ],
+      "q99": [
+        0.028309678435325586,
+        0.040855254605412394,
+        0.040161586627364146,
+        0.08192047759890528,
+        0.07792850524187081,
+        0.20382574498653397,
+        1.0
+      ],
+      "mask": [
+        true,
+        true,
+        true,
+        true,
+        true,
+        true,
+        false
+      ]
+    },
+    "proprio": {
+      "mean": [
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0
+      ],
+      "std": [
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0
+      ],
+      "max": [
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0
+      ],
+      "min": [
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0
+      ],
+      "q01": [
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0
+      ],
+      "q99": [
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0
+      ]
+    },
+    "num_transitions": 2135463,
+    "num_trajectories": 60064
+  }
+}