jian001 committed on
Commit
f40e02c
·
verified ·
1 Parent(s): 92f19fc

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +62 -0
  2. config.json +8 -8
  3. model.safetensors +2 -2
  4. train_config.json +12 -12
README.md ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ datasets: jian001/record-GRC1
3
+ library_name: lerobot
4
+ license: apache-2.0
5
+ model_name: diffusion
6
+ pipeline_tag: robotics
7
+ tags:
8
+ - robotics
9
+ - diffusion
10
+ - lerobot
11
+ ---
12
+
13
+ # Model Card for diffusion
14
+
15
+ <!-- Provide a quick summary of what the model is/does. -->
16
+
17
+
18
+ [Diffusion Policy](https://huggingface.co/papers/2303.04137) treats visuomotor control as a generative diffusion process, producing smooth, multi-step action trajectories that excel at contact-rich manipulation.
19
+
20
+
21
+ This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
22
+ See the full documentation at [LeRobot Docs](https://huggingface.co/docs/lerobot/index).
23
+
24
+ ---
25
+
26
+ ## How to Get Started with the Model
27
+
28
+ For a complete walkthrough, see the [training guide](https://huggingface.co/docs/lerobot/il_robots#train-a-policy).
29
+ Below is a short version of how to train the policy and run inference/evaluation:
30
+
31
+ ### Train from scratch
32
+
33
+ ```bash
34
+ python -m lerobot.scripts.train \
35
+ --dataset.repo_id=${HF_USER}/<dataset> \
36
+ --policy.type=diffusion \
37
+ --output_dir=outputs/train/<desired_policy_repo_id> \
38
+ --job_name=lerobot_training \
39
+ --policy.device=cuda \
40
+ --policy.repo_id=${HF_USER}/<desired_policy_repo_id> \
41
+ --wandb.enable=true
42
+ ```
43
+
44
+ *Writes checkpoints to `outputs/train/<desired_policy_repo_id>/checkpoints/`.*
45
+
46
+ ### Evaluate the policy/run inference
47
+
48
+ ```bash
49
+ python -m lerobot.record \
50
+ --robot.type=so100_follower \
51
+ --dataset.repo_id=<hf_user>/eval_<dataset> \
52
+ --policy.path=<hf_user>/<desired_policy_repo_id> \
53
+ --episodes=10
54
+ ```
55
+
56
+ Prefix the dataset repo with **eval\_** and supply `--policy.path` pointing to a local or hub checkpoint.
57
+
58
+ ---
59
+
60
+ ## Model Details
61
+
62
+ * **License:** apache-2.0
config.json CHANGED
@@ -41,17 +41,17 @@
41
  "device": "cuda",
42
  "use_amp": false,
43
  "push_to_hub": true,
44
- "repo_id": "/diffusion_so101_GRC1_model",
45
  "private": null,
46
  "tags": null,
47
  "license": null,
48
- "horizon": 16,
49
- "n_action_steps": 8,
50
  "drop_n_last_frames": 7,
51
  "vision_backbone": "resnet18",
52
  "crop_shape": [
53
- 84,
54
- 84
55
  ],
56
  "crop_is_random": true,
57
  "pretrained_backbone_weights": null,
@@ -59,16 +59,16 @@
59
  "spatial_softmax_num_keypoints": 32,
60
  "use_separate_rgb_encoder_per_camera": false,
61
  "down_dims": [
 
62
  512,
63
- 1024,
64
- 2048
65
  ],
66
  "kernel_size": 5,
67
  "n_groups": 8,
68
  "diffusion_step_embed_dim": 128,
69
  "use_film_scale_modulation": true,
70
  "noise_scheduler_type": "DDPM",
71
- "num_train_timesteps": 100,
72
  "beta_schedule": "squaredcos_cap_v2",
73
  "beta_start": 0.0001,
74
  "beta_end": 0.02,
 
41
  "device": "cuda",
42
  "use_amp": false,
43
  "push_to_hub": true,
44
+ "repo_id": "jian001/diffusion_so101_GRC1",
45
  "private": null,
46
  "tags": null,
47
  "license": null,
48
+ "horizon": 8,
49
+ "n_action_steps": 6,
50
  "drop_n_last_frames": 7,
51
  "vision_backbone": "resnet18",
52
  "crop_shape": [
53
+ 64,
54
+ 64
55
  ],
56
  "crop_is_random": true,
57
  "pretrained_backbone_weights": null,
 
59
  "spatial_softmax_num_keypoints": 32,
60
  "use_separate_rgb_encoder_per_camera": false,
61
  "down_dims": [
62
+ 256,
63
  512,
64
+ 1024
 
65
  ],
66
  "kernel_size": 5,
67
  "n_groups": 8,
68
  "diffusion_step_embed_dim": 128,
69
  "use_film_scale_modulation": true,
70
  "noise_scheduler_type": "DDPM",
71
+ "num_train_timesteps": 40,
72
  "beta_schedule": "squaredcos_cap_v2",
73
  "beta_start": 0.0001,
74
  "beta_end": 0.02,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d08e1b92d168a6edfad4019ee5de0a9fc9f02402d458d0edfd7c41222f8844d5
3
- size 1066517736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9958dca125c1e7046fc7053ed7f10c686e90d439766aed8a30eacd7d09c70e4
3
+ size 312135688
train_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "dataset": {
3
- "repo_id": "/record-GRC1",
4
  "root": "/home/shitao/.cache/huggingface/lerobot/jian001/record-GRC1",
5
  "episodes": null,
6
  "image_transforms": {
@@ -108,17 +108,17 @@
108
  "device": "cuda",
109
  "use_amp": false,
110
  "push_to_hub": true,
111
- "repo_id": "/diffusion_so101_GRC1_model",
112
  "private": null,
113
  "tags": null,
114
  "license": null,
115
- "horizon": 16,
116
- "n_action_steps": 8,
117
  "drop_n_last_frames": 7,
118
  "vision_backbone": "resnet18",
119
  "crop_shape": [
120
- 84,
121
- 84
122
  ],
123
  "crop_is_random": true,
124
  "pretrained_backbone_weights": null,
@@ -126,16 +126,16 @@
126
  "spatial_softmax_num_keypoints": 32,
127
  "use_separate_rgb_encoder_per_camera": false,
128
  "down_dims": [
 
129
  512,
130
- 1024,
131
- 2048
132
  ],
133
  "kernel_size": 5,
134
  "n_groups": 8,
135
  "diffusion_step_embed_dim": 128,
136
  "use_film_scale_modulation": true,
137
  "noise_scheduler_type": "DDPM",
138
- "num_train_timesteps": 100,
139
  "beta_schedule": "squaredcos_cap_v2",
140
  "beta_start": 0.0001,
141
  "beta_end": 0.02,
@@ -159,8 +159,8 @@
159
  "resume": false,
160
  "seed": 1000,
161
  "num_workers": 4,
162
- "batch_size": 8,
163
- "steps": 100000,
164
  "eval_freq": 20000,
165
  "log_freq": 200,
166
  "save_checkpoint": true,
@@ -193,7 +193,7 @@
193
  "project": "lerobot",
194
  "entity": null,
195
  "notes": null,
196
- "run_id": "tiea7xim",
197
  "mode": null
198
  }
199
  }
 
1
  {
2
  "dataset": {
3
+ "repo_id": "jian001/record-GRC1",
4
  "root": "/home/shitao/.cache/huggingface/lerobot/jian001/record-GRC1",
5
  "episodes": null,
6
  "image_transforms": {
 
108
  "device": "cuda",
109
  "use_amp": false,
110
  "push_to_hub": true,
111
+ "repo_id": "jian001/diffusion_so101_GRC1",
112
  "private": null,
113
  "tags": null,
114
  "license": null,
115
+ "horizon": 8,
116
+ "n_action_steps": 6,
117
  "drop_n_last_frames": 7,
118
  "vision_backbone": "resnet18",
119
  "crop_shape": [
120
+ 64,
121
+ 64
122
  ],
123
  "crop_is_random": true,
124
  "pretrained_backbone_weights": null,
 
126
  "spatial_softmax_num_keypoints": 32,
127
  "use_separate_rgb_encoder_per_camera": false,
128
  "down_dims": [
129
+ 256,
130
  512,
131
+ 1024
 
132
  ],
133
  "kernel_size": 5,
134
  "n_groups": 8,
135
  "diffusion_step_embed_dim": 128,
136
  "use_film_scale_modulation": true,
137
  "noise_scheduler_type": "DDPM",
138
+ "num_train_timesteps": 40,
139
  "beta_schedule": "squaredcos_cap_v2",
140
  "beta_start": 0.0001,
141
  "beta_end": 0.02,
 
159
  "resume": false,
160
  "seed": 1000,
161
  "num_workers": 4,
162
+ "batch_size": 12,
163
+ "steps": 30000,
164
  "eval_freq": 20000,
165
  "log_freq": 200,
166
  "save_checkpoint": true,
 
193
  "project": "lerobot",
194
  "entity": null,
195
  "notes": null,
196
+ "run_id": "nmle884x",
197
  "mode": null
198
  }
199
  }