romanrab committed on
Commit
e5fcf67
·
verified ·
1 Parent(s): 04ced39

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +62 -0
  2. config.json +4 -4
  3. model.safetensors +2 -2
  4. train_config.json +7 -7
README.md ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ datasets: romanrab/battery_box_right_arm_150
3
+ library_name: lerobot
4
+ license: apache-2.0
5
+ model_name: diffusion
6
+ pipeline_tag: robotics
7
+ tags:
8
+ - lerobot
9
+ - robotics
10
+ - diffusion
11
+ ---
12
+
13
+ # Model Card for diffusion
14
+
15
+ <!-- Provide a quick summary of what the model is/does. -->
16
+
17
+
18
+ [Diffusion Policy](https://huggingface.co/papers/2303.04137) treats visuomotor control as a generative diffusion process, producing smooth, multi-step action trajectories that excel at contact-rich manipulation.
19
+
20
+
21
+ This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
22
+ See the full documentation at [LeRobot Docs](https://huggingface.co/docs/lerobot/index).
23
+
24
+ ---
25
+
26
+ ## How to Get Started with the Model
27
+
28
+ For a complete walkthrough, see the [training guide](https://huggingface.co/docs/lerobot/il_robots#train-a-policy).
29
+ Below is the short version of how to train and run inference/eval:
30
+
31
+ ### Train from scratch
32
+
33
+ ```bash
34
+ python -m lerobot.scripts.train \
35
+ --dataset.repo_id=${HF_USER}/<dataset> \
36
+ --policy.type=diffusion \
37
+ --output_dir=outputs/train/<desired_policy_repo_id> \
38
+ --job_name=lerobot_training \
39
+ --policy.device=cuda \
40
+ --policy.repo_id=${HF_USER}/<desired_policy_repo_id> \
41
+ --wandb.enable=true
42
+ ```
43
+
44
+ _Writes checkpoints to `outputs/train/<desired_policy_repo_id>/checkpoints/`._
45
+
46
+ ### Evaluate the policy/run inference
47
+
48
+ ```bash
49
+ python -m lerobot.record \
50
+ --robot.type=so100_follower \
51
+ --dataset.repo_id=<hf_user>/eval_<dataset> \
52
+ --policy.path=<hf_user>/<desired_policy_repo_id> \
53
+ --episodes=10
54
+ ```
55
+
56
+ Prefix the dataset repo with **eval\_** and supply `--policy.path` pointing to a local or hub checkpoint.
57
+
58
+ ---
59
+
60
+ ## Model Details
61
+
62
+ - **License:** apache-2.0
config.json CHANGED
@@ -50,8 +50,8 @@
50
  "drop_n_last_frames": 7,
51
  "vision_backbone": "resnet18",
52
  "crop_shape": [
53
- 84,
54
- 84
55
  ],
56
  "crop_is_random": true,
57
  "pretrained_backbone_weights": null,
@@ -59,9 +59,9 @@
59
  "spatial_softmax_num_keypoints": 32,
60
  "use_separate_rgb_encoder_per_camera": true,
61
  "down_dims": [
 
62
  512,
63
- 1024,
64
- 2048
65
  ],
66
  "kernel_size": 5,
67
  "n_groups": 8,
 
50
  "drop_n_last_frames": 7,
51
  "vision_backbone": "resnet18",
52
  "crop_shape": [
53
+ 64,
54
+ 64
55
  ],
56
  "crop_is_random": true,
57
  "pretrained_backbone_weights": null,
 
59
  "spatial_softmax_num_keypoints": 32,
60
  "use_separate_rgb_encoder_per_camera": true,
61
  "down_dims": [
62
+ 256,
63
  512,
64
+ 1024
 
65
  ],
66
  "kernel_size": 5,
67
  "n_groups": 8,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6924ce9e8318f2a5d3f8b49ca9dfcbdc22d7ab8ef69bcd1a471f3b61d9979fb4
3
- size 1114998460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4475cdbac7d779f85360ea6911e1913870aaf1bb58dfd35f90cad32e55170955
3
+ size 358774204
train_config.json CHANGED
@@ -117,8 +117,8 @@
117
  "drop_n_last_frames": 7,
118
  "vision_backbone": "resnet18",
119
  "crop_shape": [
120
- 84,
121
- 84
122
  ],
123
  "crop_is_random": true,
124
  "pretrained_backbone_weights": null,
@@ -126,9 +126,9 @@
126
  "spatial_softmax_num_keypoints": 32,
127
  "use_separate_rgb_encoder_per_camera": true,
128
  "down_dims": [
 
129
  512,
130
- 1024,
131
- 2048
132
  ],
133
  "kernel_size": 5,
134
  "n_groups": 8,
@@ -159,12 +159,12 @@
159
  "resume": false,
160
  "seed": 1000,
161
  "num_workers": 4,
162
- "batch_size": 64,
163
- "steps": 50000,
164
  "eval_freq": 20000,
165
  "log_freq": 100,
166
  "save_checkpoint": true,
167
- "save_freq": 5000,
168
  "use_policy_training_preset": true,
169
  "optimizer": {
170
  "type": "adam",
 
117
  "drop_n_last_frames": 7,
118
  "vision_backbone": "resnet18",
119
  "crop_shape": [
120
+ 64,
121
+ 64
122
  ],
123
  "crop_is_random": true,
124
  "pretrained_backbone_weights": null,
 
126
  "spatial_softmax_num_keypoints": 32,
127
  "use_separate_rgb_encoder_per_camera": true,
128
  "down_dims": [
129
+ 256,
130
  512,
131
+ 1024
 
132
  ],
133
  "kernel_size": 5,
134
  "n_groups": 8,
 
159
  "resume": false,
160
  "seed": 1000,
161
  "num_workers": 4,
162
+ "batch_size": 32,
163
+ "steps": 15000,
164
  "eval_freq": 20000,
165
  "log_freq": 100,
166
  "save_checkpoint": true,
167
+ "save_freq": 2500,
168
  "use_policy_training_preset": true,
169
  "optimizer": {
170
  "type": "adam",