Initial model upload

Browse files

Files changed (7) hide show

config.json +64 -0
experiment_cfg/metadata.json +433 -0
model-00001-of-00002.safetensors +3 -0
model-00002-of-00002.safetensors +3 -0
model.safetensors.index.json +0 -0
scheduler.pt +3 -0
trainer_state.json +174 -0

config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "action_dim": 32,
+  "action_head_cfg": {
+    "action_dim": 32,
+    "action_horizon": 16,
+    "add_pos_embed": true,
+    "backbone_embedding_dim": 2048,
+    "diffusion_model_cfg": {
+      "attention_head_dim": 48,
+      "cross_attention_dim": 2048,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "interleave_self_attention": true,
+      "norm_type": "ada_norm",
+      "num_attention_heads": 32,
+      "num_layers": 16,
+      "output_dim": 1024,
+      "positional_embeddings": null
+    },
+    "hidden_size": 1024,
+    "input_embedding_dim": 1536,
+    "max_action_dim": 32,
+    "max_state_dim": 64,
+    "model_dtype": "float32",
+    "noise_beta_alpha": 1.5,
+    "noise_beta_beta": 1.0,
+    "noise_s": 0.999,
+    "num_inference_timesteps": 4,
+    "num_target_vision_tokens": 32,
+    "num_timestep_buckets": 1000,
+    "tune_diffusion_model": true,
+    "tune_projector": true,
+    "use_vlln": true,
+    "vl_self_attention_cfg": {
+      "attention_head_dim": 64,
+      "dropout": 0.2,
+      "final_dropout": true,
+      "num_attention_heads": 32,
+      "num_layers": 4,
+      "positional_embeddings": null
+    }
+  },
+  "action_horizon": 16,
+  "architectures": [
+    "GR00T_N1_5"
+  ],
+  "attn_implementation": null,
+  "backbone_cfg": {
+    "eagle_path": "NVEagle/eagle_er-qwen3_1_7B-Siglip2_400M_stage1_5_128gpu_er_v7_1mlp_nops",
+    "load_bf16": false,
+    "project_to_dim": null,
+    "reproject_vision": false,
+    "select_layer": 12,
+    "tune_llm": false,
+    "tune_visual": true,
+    "use_flash_attention": true
+  },
+  "compute_dtype": "bfloat16",
+  "hidden_size": 2048,
+  "model_dtype": "float32",
+  "model_type": "gr00t_n1_5",
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.51.3"
+}

experiment_cfg/metadata.json ADDED Viewed

	@@ -0,0 +1,433 @@

+{
+    "libero_franka": {
+        "statistics": {
+            "state": {
+                "x": {
+                    "max": [
+                        0.14580604434013367
+                    ],
+                    "min": [
+                        -0.1765444278717041
+                    ],
+                    "mean": [
+                        -0.02999030612409115
+                    ],
+                    "std": [
+                        0.06694897264242172
+                    ],
+                    "q01": [
+                        -0.14911890715360643
+                    ],
+                    "q99": [
+                        0.09063626825809479
+                    ]
+                },
+                "y": {
+                    "max": [
+                        0.33216384053230286
+                    ],
+                    "min": [
+                        -0.29457300901412964
+                    ],
+                    "mean": [
+                        -0.007947085425257683
+                    ],
+                    "std": [
+                        0.17608462274074554
+                    ],
+                    "q01": [
+                        -0.25978428691625594
+                    ],
+                    "q99": [
+                        0.29066365867853167
+                    ]
+                },
+                "z": {
+                    "max": [
+                        0.3857804834842682
+                    ],
+                    "min": [
+                        0.008128180168569088
+                    ],
+                    "mean": [
+                        0.20293472707271576
+                    ],
+                    "std": [
+                        0.07807064801454544
+                    ],
+                    "q01": [
+                        0.009925739830359817
+                    ],
+                    "q99": [
+                        0.3370887073874472
+                    ]
+                },
+                "roll": {
+                    "max": [
+                        3.4003844261169434
+                    ],
+                    "min": [
+                        2.2890501022338867
+                    ],
+                    "mean": [
+                        3.1086409091949463
+                    ],
+                    "std": [
+                        0.0868484303355217
+                    ],
+                    "q01": [
+                        2.7545341420173646
+                    ],
+                    "q99": [
+                        3.2611824750900267
+                    ]
+                },
+                "pitch": {
+                    "max": [
+                        0.7954911589622498
+                    ],
+                    "min": [
+                        -1.883241891860962
+                    ],
+                    "mean": [
+                        -0.21404768526554108
+                    ],
+                    "std": [
+                        0.33540457487106323
+                    ],
+                    "q01": [
+                        -1.3996034812927245
+                    ],
+                    "q99": [
+                        0.32092821151018125
+                    ]
+                },
+                "yaw": {
+                    "max": [
+                        0.6642207503318787
+                    ],
+                    "min": [
+                        -1.0600427389144897
+                    ],
+                    "mean": [
+                        -0.11307074874639511
+                    ],
+                    "std": [
+                        0.20728276669979095
+                    ],
+                    "q01": [
+                        -0.6867720144987106
+                    ],
+                    "q99": [
+                        0.4037663781642913
+                    ]
+                },
+                "gripper": {
+                    "max": [
+                        0.04104341194033623,
+                        -0.00018117300351150334
+                    ],
+                    "min": [
+                        0.0006495157140307128,
+                        -0.041782498359680176
+                    ],
+                    "mean": [
+                        0.029380427673459053,
+                        -0.030556727200746536
+                    ],
+                    "std": [
+                        0.00956575945019722,
+                        0.009197483770549297
+                    ],
+                    "q01": [
+                        0.008197814421728254,
+                        -0.04015838988125324
+                    ],
+                    "q99": [
+                        0.039891827926039694,
+                        -0.009106044843792932
+                    ]
+                }
+            },
+            "action": {
+                "x": {
+                    "max": [
+                        0.9375
+                    ],
+                    "min": [
+                        -0.8839285969734192
+                    ],
+                    "mean": [
+                        0.07096529006958008
+                    ],
+                    "std": [
+                        0.2681235373020172
+                    ],
+                    "q01": [
+                        -0.5383928418159485
+                    ],
+                    "q99": [
+                        0.8464285731315613
+                    ]
+                },
+                "y": {
+                    "max": [
+                        0.8919642567634583
+                    ],
+                    "min": [
+                        -0.9375
+                    ],
+                    "mean": [
+                        0.13498851656913757
+                    ],
+                    "std": [
+                        0.43846824765205383
+                    ],
+                    "q01": [
+                        -0.8758928775787354
+                    ],
+                    "q99": [
+                        0.84375
+                    ]
+                },
+                "z": {
+                    "max": [
+                        0.9375
+                    ],
+                    "min": [
+                        -0.9375
+                    ],
+                    "mean": [
+                        -0.04601382836699486
+                    ],
+                    "std": [
+                        0.4474974274635315
+                    ],
+                    "q01": [
+                        -0.9375
+                    ],
+                    "q99": [
+                        0.9375
+                    ]
+                },
+                "roll": {
+                    "max": [
+                        0.17678570747375488
+                    ],
+                    "min": [
+                        -0.15000000596046448
+                    ],
+                    "mean": [
+                        0.00123520044144243
+                    ],
+                    "std": [
+                        0.024446550756692886
+                    ],
+                    "q01": [
+                        -0.06964285671710968
+                    ],
+                    "q99": [
+                        0.08142857253551483
+                    ]
+                },
+                "pitch": {
+                    "max": [
+                        0.35035714507102966
+                    ],
+                    "min": [
+                        -0.29035714268684387
+                    ],
+                    "mean": [
+                        0.006998839322477579
+                    ],
+                    "std": [
+                        0.049355510622262955
+                    ],
+                    "q01": [
+                        -0.11678571254014969
+                    ],
+                    "q99": [
+                        0.14892856776714325
+                    ]
+                },
+                "yaw": {
+                    "max": [
+                        0.1810714304447174
+                    ],
+                    "min": [
+                        -0.32892856001853943
+                    ],
+                    "mean": [
+                        -0.015027612447738647
+                    ],
+                    "std": [
+                        0.042107198387384415
+                    ],
+                    "q01": [
+                        -0.15964286029338837
+                    ],
+                    "q99": [
+                        0.0867857113480568
+                    ]
+                },
+                "gripper": {
+                    "max": [
+                        1.0
+                    ],
+                    "min": [
+                        0.0
+                    ],
+                    "mean": [
+                        0.46428999304771423
+                    ],
+                    "std": [
+                        0.49879148602485657
+                    ],
+                    "q01": [
+                        0.0
+                    ],
+                    "q99": [
+                        1.0
+                    ]
+                }
+            }
+        },
+        "modalities": {
+            "video": {
+                "image": {
+                    "resolution": [
+                        256,
+                        256
+                    ],
+                    "channels": 3,
+                    "fps": 20.0
+                },
+                "wrist_image": {
+                    "resolution": [
+                        256,
+                        256
+                    ],
+                    "channels": 3,
+                    "fps": 20.0
+                }
+            },
+            "state": {
+                "x": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "y": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "z": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "roll": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "pitch": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "yaw": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "gripper": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        2
+                    ],
+                    "continuous": true
+                }
+            },
+            "action": {
+                "x": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "y": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "z": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "roll": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "pitch": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "yaw": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                },
+                "gripper": {
+                    "absolute": true,
+                    "rotation_type": null,
+                    "shape": [
+                        1
+                    ],
+                    "continuous": true
+                }
+            }
+        },
+        "embodiment_tag": "libero_franka"
+    }
+}

model-00001-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:636066fca40fbd69b0b2c4d160ee0f9656c565c161d5f1c5b3a1acfe05944dae
+size 4999367032

model-00002-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b4917b473d89d5a31af802fe4e40e0dbe73866a938b9cd39fd1bbb9b6d55eec0
+size 2586705312

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d2d754412c61116546142914503e7369d0cc35d3c380a07e5218f595d76b6d96
+size 1064

trainer_state.json ADDED Viewed

	@@ -0,0 +1,174 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 3.0303030303030303,
+  "eval_steps": 500,
+  "global_step": 200,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.15151515151515152,
+      "grad_norm": 1.0779532194137573,
+      "learning_rate": 9e-05,
+      "loss": 0.5809,
+      "step": 10
+    },
+    {
+      "epoch": 0.30303030303030304,
+      "grad_norm": 1.257666826248169,
+      "learning_rate": 9.944739353007344e-05,
+      "loss": 0.2898,
+      "step": 20
+    },
+    {
+      "epoch": 0.45454545454545453,
+      "grad_norm": 1.1526721715927124,
+      "learning_rate": 9.755282581475769e-05,
+      "loss": 0.1944,
+      "step": 30
+    },
+    {
+      "epoch": 0.6060606060606061,
+      "grad_norm": 0.740468442440033,
+      "learning_rate": 9.43611409721806e-05,
+      "loss": 0.1489,
+      "step": 40
+    },
+    {
+      "epoch": 0.7575757575757576,
+      "grad_norm": 0.5122345089912415,
+      "learning_rate": 8.995939984474624e-05,
+      "loss": 0.1241,
+      "step": 50
+    },
+    {
+      "epoch": 0.9090909090909091,
+      "grad_norm": 0.3294401168823242,
+      "learning_rate": 8.44676704559283e-05,
+      "loss": 0.1162,
+      "step": 60
+    },
+    {
+      "epoch": 1.0606060606060606,
+      "grad_norm": 0.3713489770889282,
+      "learning_rate": 7.803575286758364e-05,
+      "loss": 0.105,
+      "step": 70
+    },
+    {
+      "epoch": 1.2121212121212122,
+      "grad_norm": 0.38999056816101074,
+      "learning_rate": 7.083909302476453e-05,
+      "loss": 0.102,
+      "step": 80
+    },
+    {
+      "epoch": 1.3636363636363638,
+      "grad_norm": 0.313165545463562,
+      "learning_rate": 6.307399704769099e-05,
+      "loss": 0.0917,
+      "step": 90
+    },
+    {
+      "epoch": 1.5151515151515151,
+      "grad_norm": 0.2271764725446701,
+      "learning_rate": 5.495227651252315e-05,
+      "loss": 0.0896,
+      "step": 100
+    },
+    {
+      "epoch": 1.6666666666666665,
+      "grad_norm": 0.2582443356513977,
+      "learning_rate": 4.669547078371504e-05,
+      "loss": 0.0906,
+      "step": 110
+    },
+    {
+      "epoch": 1.8181818181818183,
+      "grad_norm": 0.28969135880470276,
+      "learning_rate": 3.852880399766243e-05,
+      "loss": 0.0898,
+      "step": 120
+    },
+    {
+      "epoch": 1.9696969696969697,
+      "grad_norm": 0.21474944055080414,
+      "learning_rate": 3.0675041535377405e-05,
+      "loss": 0.0858,
+      "step": 130
+    },
+    {
+      "epoch": 2.121212121212121,
+      "grad_norm": 0.17501652240753174,
+      "learning_rate": 2.3348413563600325e-05,
+      "loss": 0.0827,
+      "step": 140
+    },
+    {
+      "epoch": 2.2727272727272725,
+      "grad_norm": 0.17531634867191315,
+      "learning_rate": 1.6748771394307585e-05,
+      "loss": 0.0835,
+      "step": 150
+    },
+    {
+      "epoch": 2.4242424242424243,
+      "grad_norm": 0.1865883618593216,
+      "learning_rate": 1.1056136061894384e-05,
+      "loss": 0.0795,
+      "step": 160
+    },
+    {
+      "epoch": 2.5757575757575757,
+      "grad_norm": 0.23194383084774017,
+      "learning_rate": 6.425787818636131e-06,
+      "loss": 0.0871,
+      "step": 170
+    },
+    {
+      "epoch": 2.7272727272727275,
+      "grad_norm": 0.15936115384101868,
+      "learning_rate": 2.9840304941919415e-06,
+      "loss": 0.0838,
+      "step": 180
+    },
+    {
+      "epoch": 2.878787878787879,
+      "grad_norm": 0.18423740565776825,
+      "learning_rate": 8.247462563808817e-07,
+      "loss": 0.0791,
+      "step": 190
+    },
+    {
+      "epoch": 3.0303030303030303,
+      "grad_norm": 0.13376280665397644,
+      "learning_rate": 6.834750376549792e-09,
+      "loss": 0.0796,
+      "step": 200
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 200,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 40,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0.0,
+  "train_batch_size": 128,
+  "trial_name": null,
+  "trial_params": null
+}