ehalicki
/

lewam-so101-pretrained

Model card | Files and versions

ehalicki committed 24 days ago

Commit

7d061b3

·

verified ·

1 Parent(s): 6303227

Upload LeWAM weights

Files changed (3) hide show

README.md +1 -0
config.json +65 -15
model.safetensors +2 -2

README.md CHANGED Viewed

@@ -14,6 +14,7 @@ Joint video-action flow-matching model for robot control.
 - **Context frames**: 32 @ 5 fps
 - **Future frames**: 8
 - **Action dim**: 6 @ 30 fps
 ## Usage

 - **Context frames**: 32 @ 5 fps
 - **Future frames**: 8
 - **Action dim**: 6 @ 30 fps
+- **Cameras**: image1, image2
 ## Usage

config.json CHANGED Viewed

@@ -1,17 +1,67 @@
 {
-  "model_dim": 512,
-  "depth": 12,
-  "num_heads": 8,
-  "num_context_frames": 32,
-  "num_future_frames": 8,
-  "frame_latent_h": 14,
-  "frame_latent_w": 14,
-  "fps": 5,
-  "action_fps": 30,
-  "action_dim": 6,
-  "state_dim": 6,
-  "vlm_model_id": "HuggingFaceTB/SmolVLM2-256M-Video-Instruct",
-  "vlm_num_layers": 4,
-  "norm_strategy": "q2_q98",
-  "mlp_ratio": 4.0
 }

 {
+    "type": "lewam",
+    "n_obs_steps": 1,
+    "input_features": {
+        "observation.images.image1": {
+            "type": "VISUAL",
+            "shape": [
+                3,
+                480,
+                640
+            ]
+        },
+        "observation.images.image2": {
+            "type": "VISUAL",
+            "shape": [
+                3,
+                480,
+                640
+            ]
+        },
+        "observation.state": {
+            "type": "STATE",
+            "shape": [
+                6
+            ]
+        }
+    },
+    "output_features": {
+        "action": {
+            "type": "ACTION",
+            "shape": [
+                6
+            ]
+        }
+    },
+    "device": "cuda",
+    "use_amp": false,
+    "use_peft": false,
+    "push_to_hub": true,
+    "repo_id": null,
+    "private": null,
+    "tags": null,
+    "license": null,
+    "pretrained_path": null,
+    "model_dim": 512,
+    "depth": 12,
+    "num_heads": 8,
+    "mlp_ratio": 4.0,
+    "vlm_model_id": "HuggingFaceTB/SmolVLM2-256M-Video-Instruct",
+    "vlm_num_layers": 4,
+    "norm_strategy": "q2_q98",
+    "num_ode_steps": 10,
+    "smooth_actions": true,
+    "crop_size": 224,
+    "fps": 5,
+    "action_fps": 30,
+    "num_context_frames": 32,
+    "num_future_frames": 8,
+    "n_action_steps": 48,
+    "action_weight": 1.0,
+    "lang_drop_rate": 0.1,
+    "normalization_mapping": {
+        "VISUAL": "IDENTITY",
+        "STATE": "IDENTITY",
+        "ACTION": "IDENTITY"
+    }
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:522e9cb9059b69ae1499d527e164673f6c845b6e388961f7573e3e01f638b111
-size 1280453152

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc8fa5a7451494a22ed9bd3f18262402c86dc6f55b568ccc6945d82296330a04
+size 1280458528