Upload model checkpoint (7 files, 20.6 GB)

Browse files

Files changed (7) hide show

config.json +120 -0
model-00001-of-00005.safetensors +3 -0
model-00002-of-00005.safetensors +3 -0
model-00003-of-00005.safetensors +3 -0
model-00004-of-00005.safetensors +3 -0
model-00005-of-00005.safetensors +3 -0
model.safetensors.index.json +0 -0

config.json ADDED Viewed

	@@ -0,0 +1,120 @@

+{
+  "action_in_proj_cfg": {
+    "_target_": "alpamayo1_5.models.action_in_proj.PerWaypointActionInProjV2",
+    "hidden_size": 512,
+    "max_freq": 100.0,
+    "num_enc_layers": 2,
+    "num_fourier_feats": 20
+  },
+  "action_out_proj_cfg": {
+    "_target_": "torch.nn.Linear"
+  },
+  "action_space_cfg": {
+    "_target_": "alpamayo1_5.action_space.UnicycleAccelCurvatureActionSpace",
+    "a_lambda": 0.0001,
+    "a_ridge": 0.0001,
+    "accel_bounds": [
+      -9.8,
+      9.8
+    ],
+    "accel_mean": 0.02902694707164455,
+    "accel_std": 0.6810426736454882,
+    "curvature_bounds": [
+      -0.33,
+      0.33
+    ],
+    "curvature_mean": 0.0002692167976330542,
+    "curvature_std": 0.026148280660833106,
+    "dt": 0.1,
+    "kappa_lambda": 0.0001,
+    "kappa_ridge": 0.0001,
+    "n_waypoints": 64,
+    "theta_lambda": 1e-06,
+    "theta_ridge": 1e-08,
+    "v_lambda": 1e-06,
+    "v_ridge": 0.0001
+  },
+  "architectures": [
+    "Alpamayo1_5"
+  ],
+  "attn_implementation": "flash_attention_2",
+  "diffusion_cfg": {
+    "_target_": "alpamayo1_5.diffusion.flow_matching.FlowMatching",
+    "int_method": "euler",
+    "x_dims": null
+  },
+  "dtype": "bfloat16",
+  "expert_cfg": {
+    "head_dim": 128,
+    "hidden_size": 2048,
+    "intermediate_size": 8256,
+    "num_attention_heads": 16
+  },
+  "expert_non_causal_attention": true,
+  "hist_traj_tokenizer_cfg": {
+    "_target_": "alpamayo1_5.models.delta_tokenizer.DeltaTrajectoryTokenizer"
+  },
+  "include_camera_ids": true,
+  "include_frame_nums": true,
+  "keep_same_dtype": true,
+  "max_pixels": 196608,
+  "min_pixels": 163840,
+  "model_dtype": "bfloat16",
+  "model_type": "alpamayo1_5",
+  "padding_side": "left",
+  "tokens_per_future_traj": 128,
+  "tokens_per_history_traj": 48,
+  "traj_token_ids": {
+    "future": 155685,
+    "future_end": 155683,
+    "future_start": 155681,
+    "history": 155684,
+    "history_end": 155676,
+    "history_start": 155674
+  },
+  "traj_token_start_idx": 151669,
+  "traj_tokenizer_cfg": {
+    "_recursive_": false,
+    "_target_": "alpamayo1_5.action_space.discrete_action_space.DiscreteTrajectoryTokenizer",
+    "action_space_cfg": {
+      "_target_": "alpamayo1_5.action_space.UnicycleAccelCurvatureActionSpace",
+      "a_lambda": 0.0001,
+      "a_ridge": 0.0001,
+      "accel_bounds": [
+        -9.8,
+        9.8
+      ],
+      "accel_mean": 0.02902694707164455,
+      "accel_std": 0.6810426736454882,
+      "curvature_bounds": [
+        -0.33,
+        0.33
+      ],
+      "curvature_mean": 0.0002692167976330542,
+      "curvature_std": 0.026148280660833106,
+      "dt": 0.1,
+      "kappa_lambda": 0.0001,
+      "kappa_ridge": 0.0001,
+      "n_waypoints": 64,
+      "theta_lambda": 1e-06,
+      "theta_ridge": 1e-08,
+      "v_lambda": 1e-06,
+      "v_ridge": 0.0001
+    },
+    "dims_max": [
+      10,
+      10
+    ],
+    "dims_min": [
+      -10,
+      -10
+    ],
+    "num_bins": 3000
+  },
+  "traj_vocab_size": 4000,
+  "transformers_version": "4.57.1",
+  "vlm_backend": "qwenvl3",
+  "vlm_name_or_path": "nvidia/Cosmos-Reason2-8B",
+  "vocab_size": 155697,
+  "add_special_tokens": true
+}

model-00001-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:537259bb56815f9dfdcb028d5606e84dff5ab0c8e0e559782d63d91b6671d15c
+size 4928204944

model-00002-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:18841e5049b7836c16c034123ae6d40b2ff0414f9f77008bc7ca72490302a47b
+size 4915963032

model-00003-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e8953b27fe827a60604a006b07ab1216fe766375f9926d1c3bd5ecee84ecef78
+size 4983071160

model-00004-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:604f0c0f19986f363a23a1e0b5736eedadd231ca285beab28d5db968a1d37602
+size 4980341192

model-00005-of-00005.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d889c09634e5a21b4c957957ede2cdab4418c268ee1d870c1f942d04242adf6
+size 2349614196

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff