Safetensors
mayasg commited on
Commit
94807a0
·
verified ·
1 Parent(s): 52a2562

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +69 -5
README.md CHANGED
@@ -1,5 +1,69 @@
1
- ---
2
- license: other
3
- license_name: other
4
- license_link: LICENSE
5
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ license_name: other
4
+ license_link: LICENSE
5
+ ---
6
+ # MolmoBot-SPOC-RBY1Articulated
7
+
8
+ [[Paper](https://arxiv.org/pdf/2603.16861)] [[Project Website](https://allenai.github.io/MolmoBot)] [[Code](https://github.com/allenai/MolmoBot/tree/main/MolmoBot-SPOC)] [[Data](https://huggingface.co/datasets/allenai/molmobot-data)]
9
+
10
+ MolmoBot-SPOC-RBY1Articulated is the MolmoBot-SPOC model trained on simulation data on the RB-Y1 platform, **without any real robot data**. See [here](https://github.com/allenai/MolmoBot/tree/main/MolmoBot-SPOC) for usage instructions.
11
+
12
+ ## Quickstart
13
+
14
+
15
+ ```python
16
+ import numpy as np
17
+ from huggingface_hub import snapshot_download
18
+ from molmobot_spoc.eval.config.rby1_eval_config import RBY1EvalBaseConfig
19
+ from molmobot_spoc.eval.config.spoc_policy_configs import SPOCRBY1ArticulatedManipPolicyConfig
20
+ from molmobot_spoc.eval.spoc_policy import SPOCModelPolicy
21
+
22
+
23
+ ckpt_dir = snapshot_download("allenai/MolmoBot-SPOC-RBY1Articulated")
24
+ policy_config = SPOCRBY1ArticulatedManipPolicyConfig(checkpoint_dir=ckpt_dir)
25
+ config = RBY1EvalBaseConfig(
26
+ policy_config=policy_config, task_type="open"
27
+ ) # Try with "door_open" too!
28
+
29
+ policy = SPOCModelPolicy(config, config.task_type)
30
+
31
+ obs = {
32
+ "head_camera": np.zeros((576, 768, 3), dtype=np.uint8),
33
+ "wrist_camera_r": np.zeros((576, 768, 3), dtype=np.uint8),
34
+ "wrist_camera_l": np.zeros((576, 768, 3), dtype=np.uint8),
35
+ "qpos": {
36
+ "left_arm": np.zeros((7,), dtype=np.float32),
37
+ "right_arm": np.zeros((7,), dtype=np.float32),
38
+ "torso": np.zeros((6,), dtype=np.float32),
39
+ "left_gripper": np.zeros((2,), dtype=np.float32),
40
+ "right_gripper": np.zeros((2,), dtype=np.float32),
41
+ },
42
+ "goal": "open the drawer",
43
+ "object_image_points": {
44
+ "pickup_obj": { # NOTE: Use "pickup_obj" for open tasks, "door_handle" for door_open tasks.
45
+ "head_camera": {
46
+ "points": [[0.45, 0.52]] # list of [x, y] candidates; one is sampled at runtime
47
+ }
48
+ }
49
+ }
50
+ }
51
+ # NOTE: get_action saves an internal buffer with the chunk and returns actions 1 by 1. To get the whole chunk, use model_output_to_action
52
+ # NOTE: the policy internally saves the first frame to ground the image point with
53
+ action = policy.get_action(obs)
54
+ print(action)
55
+ ```
56
+
57
+ ## BibTeX
58
+
59
+ ```
60
+ @misc{deshpande2026molmobot,
61
+ title={MolmoB0T: Large-Scale Simulation Enables Zero-Shot Manipulation},
62
+ author={Abhay Deshpande and Maya Guru and Rose Hendrix and Snehal Jauhri and Ainaz Eftekhar and Rohun Tripathi and Max Argus and Jordi Salvador and Haoquan Fang and Matthew Wallingford and Wilbert Pumacay and Yejin Kim and Quinn Pfeifer and Ying-Chun Lee and Piper Wolters and Omar Rayyan and Mingtong Zhang and Jiafei Duan and Karen Farley and Winson Han and Eli Vanderbilt and Dieter Fox and Ali Farhadi and Georgia Chalvatzaki and Dhruv Shah and Ranjay Krishna},
63
+ year={2026},
64
+ eprint={2603.16861},
65
+ archivePrefix={arXiv},
66
+ primaryClass={cs.RO},
67
+ url={https://arxiv.org/abs/2603.16861},
68
+ }
69
+ ```