Initial model upload

Browse files

Files changed (5) hide show

config.json +64 -0
experiment_cfg/metadata.json +433 -0
model.safetensors +3 -0
scheduler.pt +3 -0
trainer_state.json +90 -0

config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "action_dim": 32,
+  "action_head_cfg": {
+    "action_dim": 32,
+    "action_horizon": 16,
+    "add_pos_embed": true,
+    "backbone_embedding_dim": 2048,
+    "diffusion_model_cfg": {
+      "attention_head_dim": 48,
+      "cross_attention_dim": 2048,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "interleave_self_attention": true,
+      "norm_type": "ada_norm",
+      "num_attention_heads": 32,
+      "num_layers": 16,
+      "output_dim": 1024,
+      "positional_embeddings": null
+    },
+    "hidden_size": 1024,
+    "input_embedding_dim": 1536,
+    "max_action_dim": 32,
+    "max_state_dim": 64,
+    "model_dtype": "float32",
+    "noise_beta_alpha": 1.5,
+    "noise_beta_beta": 1.0,
+    "noise_s": 0.999,
+    "num_inference_timesteps": 4,
+    "num_target_vision_tokens": 32,
+    "num_timestep_buckets": 1000,
+    "tune_diffusion_model": true,
+    "tune_projector": true,
+    "use_vlln": true,
+    "vl_self_attention_cfg": {
+      "attention_head_dim": 64,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "num_attention_heads": 32,
+      "num_layers": 4,
+      "positional_embeddings": null
+    }
+  },
+  "action_horizon": 16,
+  "architectures": [
+    "GR00T_N1_5"
+  ],
+  "attn_implementation": null,
+  "backbone_cfg": {
+    "eagle_path": "NVEagle/eagle_er-qwen3_1_7B-Siglip2_400M_stage1_5_128gpu_er_v7_1mlp_nops",
+    "load_bf16": false,
+    "project_to_dim": null,
+    "reproject_vision": false,
+    "select_layer": 12,
+    "tune_llm": false,
+    "tune_visual": true,
+    "use_flash_attention": true
+  },
+  "compute_dtype": "bfloat16",
+  "hidden_size": 2048,
+  "model_dtype": "float32",
+  "model_type": "gr00t_n1_5",
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.51.3"
+}

experiment_cfg/metadata.json ADDED Viewed

	@@ -0,0 +1,433 @@

+{
+    "libero_franka": {
+        "statistics": {
+            "state": {
+                "x": {
+                    "max": [
+                        0.1759040206670761
+                    ],
+                    "min": [
+                        -0.3095473051071167
+                    ],
+                    "mean": [
+                        -0.024462558329105377
+                    ],
+                    "std": [
+                        0.1101478561758995
+                    ],
+                    "q01": [
+                        -0.2727657300233841
+                    ],
+                    "q99": [
+                        0.13529365032911292
+                    ]
+                },
+                "y": {
+                    "max": [
+                        0.3904820382595062
+                    ],
+                    "min": [
+                        -0.29250794649124146
+                    ],
+                    "mean": [
+                        0.106529600918293
+                    ],
+                    "std": [
+                        0.13784688711166382
+                    ],
+                    "q01": [
+                        -0.23721413239836692
+                    ],
+                    "q99": [
+                        0.3629165390133857
+                    ]
+                },
+                "z": {
+                    "max": [
+                        1.3290715217590332
+                    ],
+                    "min": [
+                        0.9095591306686401
+                    ],
+                    "mean": [
+                        1.0580483675003052
+                    ],
+                    "std": [
+                        0.1044282391667366
+                    ],
+                    "q01": [
+                        0.9160063165426254
+                    ],
+                    "q99": [
+                        1.2862326657772063
+                    ]
+                },
+                "roll": {
+                    "max": [
+                        3.4566118717193604
+                    ],
+                    "min": [
+                        2.497488260269165
+                    ],
+                    "mean": [
+                        3.0628468990325928
+                    ],
+                    "std": [
+                        0.10451053828001022
+                    ],
+                    "q01": [
+                        2.77949666261673
+                    ],
+                    "q99": [
+                        3.2829698753356933
+                    ]
+                },
+                "pitch": {
+                    "max": [
+                        1.2268599271774292
+                    ],
+                    "min": [
+                        -1.8006486892700195
+                    ],
+                    "mean": [
+                        -0.10464039444923401
+                    ],
+                    "std": [
+                        0.4112098217010498
+                    ],
+                    "q01": [
+                        -1.3187511622905732
+                    ],
+                    "q99": [
+                        0.9332760351896285
+                    ]
+                },
+                "yaw": {
+                    "max": [
+                        1.0429412126541138
+                    ],
+                    "min": [
+                        -0.7207611203193665
+                    ],
+                    "mean": [
+                        0.08307311683893204
+                    ],
+                    "std": [
+                        0.2176690548658371
+                    ],
+                    "q01": [
+                        -0.41989982962608335
+                    ],
+                    "q99": [
+                        0.6325724506378171
+                    ]
+                },
+                "gripper": {
+                    "max": [
+                        0.041053611785173416,
+                        0.000775813648942858
+                    ],
+                    "min": [
+                        -0.0004703797458205372,
+                        -0.041536275297403336
+                    ],
+                    "mean": [
+                        0.01995457336306572,
+                        -0.020162804052233696
+                    ],
+                    "std": [
+                        0.017260896041989326,
+                        0.0171116404235363
+                    ],
+                    "q01": [
+                        0.001503719249740243,
+                        -0.03989770736545324
+                    ],
+                    "q99": [
+                        0.039933966137468815,
+                        -0.001671919699292631
+                    ]
+                }
+            },
+            "action": {
+                "x": {
+                    "max": [
+                        0.9375
+                    ],
+                    "min": [
+                        -0.9375
+                    ],
+                    "mean": [
+                        0.15312479436397552
+                    ],
+                    "std": [
+                        0.41272708773612976
+                    ],
+                    "q01": [
+                        -0.7454732114076613
+                    ],
+                    "q99": [
+                        0.9375
+                    ]
+                },
+                "y": {
+                    "max": [
+                        0.9375
+                    ],
+                    "min": [
+                        -0.9375
+                    ],
+                    "mean": [
+                        0.13707277178764343
+                    ],
+                    "std": [
+                        0.34724321961402893
+                    ],
+                    "q01": [
+                        -0.6616071462631226
+                    ],
+                    "q99": [
+                        0.8758928775787354
+                    ]
+                },
+                "z": {
+                    "max": [
+                        0.9375
+                    ],
+                    "min": [
+                        -0.9375
+                    ],
+                    "mean": [
+                        -0.15526802837848663
+                    ],
+                    "std": [
+                        0.50869220495224
+                    ],
+                    "q01": [
+                        -0.9375
+                    ],
+                    "q99": [
+                        0.9321428537368774
+                    ]
+                },
+                "roll": {
+                    "max": [
+                        0.1971428543329239
+                    ],
+                    "min": [
+                        -0.1875
+                    ],
+                    "mean": [
+                        -0.005176450591534376
+                    ],
+                    "std": [
+                        0.037266165018081665
+                    ],
+                    "q01": [
+                        -0.1071428582072258
+                    ],
+                    "q99": [
+                        0.1039285734295845
+                    ]
+                },
+                "pitch": {
+                    "max": [
+                        0.33642858266830444
+                    ],
+                    "min": [
+                        -0.3675000071525574
+                    ],
+                    "mean": [
+                        -0.01120874285697937
+                    ],
+                    "std": [
+                        0.07244449853897095
+                    ],
+                    "q01": [
+                        -0.20678570866584778
+                    ],
+                    "q99": [
+                        0.17678570747375488
+                    ]
+                },
+                "yaw": {
+                    "max": [
+                        0.375
+                    ],
+                    "min": [
+                        -0.36000001430511475
+                    ],
+                    "mean": [
+                        -0.020194264128804207
+                    ],
+                    "std": [
+                        0.05762382969260216
+                    ],
+                    "q01": [
+                        -0.1842857152223587
+                    ],
+                    "q99": [
+                        0.14571428298950195
+                    ]
+                },
+                "gripper": {
+                    "max": [
+                        1.0
+                    ],
+                    "min": [
+                        0.0
+                    ],
+                    "mean": [
+                        0.4578818082809448
+                    ],
+                    "std": [
+                        0.49827873706817627
+                    ],
+                    "q01": [
+                        0.0
+                    ],
+                    "q99": [
+                        1.0
+                    ]
+                }
+            }
+        },
+        "modalities": {
+            "video": {
+                "image": {
+                    "resolution": [
+                        256,
+                        256
+                    ],
+                    "channels": 3,
+                    "fps": 20.0
+                },
+                "wrist_image": {
+                    "resolution": [
+                        256,
+                        256
+                    ],
+                    "channels": 3,
+                    "fps": 20.0
+                }
+            },
+            "state": {
+                "x": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "y": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "z": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "roll": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "pitch": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "yaw": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "gripper": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        2
+                    ],
+                    "continuous": true
+                }
+            },
+            "action": {
+                "x": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "y": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "z": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "roll": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "pitch": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "yaw": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "gripper": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                }
+            }
+        },
+        "embodiment_tag": "libero_franka"
+    }
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83984aabcad10167d417285c1718c1d5a3807cf2f8b991c6815dcd781756aec6
+size 5449839514

scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da226c44306b9d44cb710a3e43a9625a10e7d1c86f899d409c15432084a7060b
+size 1064

trainer_state.json ADDED Viewed

	@@ -0,0 +1,90 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.5384615384615383,
+  "eval_steps": 500,
+  "global_step": 80,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.19230769230769232,
+      "grad_norm": 1.0270750522613525,
+      "learning_rate": 9.956320346634876e-05,
+      "loss": 0.5994,
+      "step": 10
+    },
+    {
+      "epoch": 0.38461538461538464,
+      "grad_norm": 1.0943247079849243,
+      "learning_rate": 9.473646649103818e-05,
+      "loss": 0.306,
+      "step": 20
+    },
+    {
+      "epoch": 0.5769230769230769,
+      "grad_norm": 0.8214321732521057,
+      "learning_rate": 8.506183921362443e-05,
+      "loss": 0.2207,
+      "step": 30
+    },
+    {
+      "epoch": 0.7692307692307693,
+      "grad_norm": 0.7468852400779724,
+      "learning_rate": 7.158771761692464e-05,
+      "loss": 0.1827,
+      "step": 40
+    },
+    {
+      "epoch": 0.9615384615384616,
+      "grad_norm": 0.5866342782974243,
+      "learning_rate": 5.577423184847932e-05,
+      "loss": 0.1552,
+      "step": 50
+    },
+    {
+      "epoch": 1.1538461538461537,
+      "grad_norm": 0.3692125678062439,
+      "learning_rate": 3.933501846281267e-05,
+      "loss": 0.1458,
+      "step": 60
+    },
+    {
+      "epoch": 1.3461538461538463,
+      "grad_norm": 0.33734169602394104,
+      "learning_rate": 2.405152131093926e-05,
+      "loss": 0.1356,
+      "step": 70
+    },
+    {
+      "epoch": 1.5384615384615383,
+      "grad_norm": 0.29717421531677246,
+      "learning_rate": 1.157994445715706e-05,
+      "loss": 0.1356,
+      "step": 80
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 100,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 20,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0.0,
+  "train_batch_size": 128,
+  "trial_name": null,
+  "trial_params": null
+}