Xiaoyan97 committed on
Commit
d4c4caa
·
verified ·
1 Parent(s): 0935506

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. config.json +13 -6
  3. model.safetensors +1 -1
  4. train_config.json +16 -9
README.md CHANGED
@@ -6,8 +6,8 @@ model_name: pi05
6
  pipeline_tag: robotics
7
  tags:
8
  - robotics
9
- - lerobot
10
  - pi05
 
11
  ---
12
 
13
  # Model Card for pi05
 
6
  pipeline_tag: robotics
7
  tags:
8
  - robotics
 
9
  - pi05
10
+ - lerobot
11
  ---
12
 
13
  # Model Card for pi05
config.json CHANGED
@@ -49,7 +49,7 @@
49
  "private": null,
50
  "tags": null,
51
  "license": null,
52
- "pretrained_path": "lerobot/pi05_base",
53
  "paligemma_variant": "gemma_2b",
54
  "action_expert_variant": "gemma_300m",
55
  "dtype": "bfloat16",
@@ -64,7 +64,14 @@
64
  "time_sampling_offset": 0.001,
65
  "min_period": 0.004,
66
  "max_period": 4.0,
67
- "rtc_config": null,
 
 
 
 
 
 
 
68
  "image_resolution": [
69
  224,
70
  224
@@ -81,7 +88,7 @@
81
  "compile_mode": "max-autotune",
82
  "freeze_vision_encoder": false,
83
  "train_expert_only": false,
84
- "optimizer_lr": 2.5e-05,
85
  "optimizer_betas": [
86
  0.9,
87
  0.95
@@ -89,7 +96,7 @@
89
  "optimizer_eps": 1e-08,
90
  "optimizer_weight_decay": 0.01,
91
  "optimizer_grad_clip_norm": 1.0,
92
- "scheduler_warmup_steps": 1000,
93
- "scheduler_decay_steps": 30000,
94
- "scheduler_decay_lr": 2.5e-06
95
  }
 
49
  "private": null,
50
  "tags": null,
51
  "license": null,
52
+ "pretrained_path": "outputs/pi05_training/checkpoints/last/pretrained_model",
53
  "paligemma_variant": "gemma_2b",
54
  "action_expert_variant": "gemma_300m",
55
  "dtype": "bfloat16",
 
64
  "time_sampling_offset": 0.001,
65
  "min_period": 0.004,
66
  "max_period": 4.0,
67
+ "rtc_config": {
68
+ "enabled": true,
69
+ "prefix_attention_schedule": "LINEAR",
70
+ "max_guidance_weight": 10.0,
71
+ "execution_horizon": 10,
72
+ "debug": false,
73
+ "debug_maxlen": 100
74
+ },
75
  "image_resolution": [
76
  224,
77
  224
 
88
  "compile_mode": "max-autotune",
89
  "freeze_vision_encoder": false,
90
  "train_expert_only": false,
91
+ "optimizer_lr": 5e-05,
92
  "optimizer_betas": [
93
  0.9,
94
  0.95
 
96
  "optimizer_eps": 1e-08,
97
  "optimizer_weight_decay": 0.01,
98
  "optimizer_grad_clip_norm": 1.0,
99
+ "scheduler_warmup_steps": 5000,
100
+ "scheduler_decay_steps": 25000,
101
+ "scheduler_decay_lr": 5e-05
102
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fc2ace1799de79abe223e8c6b83125bcb8f975823ce8d09b0cbce2ec7d069e5
3
  size 7473096344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc0f99055c88a962604e1efae09e46e9392995ea7c4cbaa91f42bb02961fd541
3
  size 7473096344
train_config.json CHANGED
@@ -131,7 +131,7 @@
131
  "private": null,
132
  "tags": null,
133
  "license": null,
134
- "pretrained_path": "lerobot/pi05_base",
135
  "paligemma_variant": "gemma_2b",
136
  "action_expert_variant": "gemma_300m",
137
  "dtype": "bfloat16",
@@ -146,7 +146,14 @@
146
  "time_sampling_offset": 0.001,
147
  "min_period": 0.004,
148
  "max_period": 4.0,
149
- "rtc_config": null,
 
 
 
 
 
 
 
150
  "image_resolution": [
151
  224,
152
  224
@@ -163,7 +170,7 @@
163
  "compile_mode": "max-autotune",
164
  "freeze_vision_encoder": false,
165
  "train_expert_only": false,
166
- "optimizer_lr": 2.5e-05,
167
  "optimizer_betas": [
168
  0.9,
169
  0.95
@@ -171,17 +178,17 @@
171
  "optimizer_eps": 1e-08,
172
  "optimizer_weight_decay": 0.01,
173
  "optimizer_grad_clip_norm": 1.0,
174
- "scheduler_warmup_steps": 1000,
175
- "scheduler_decay_steps": 30000,
176
- "scheduler_decay_lr": 2.5e-06
177
  },
178
  "output_dir": "outputs/pi05_training",
179
  "job_name": "pi05_training",
180
- "resume": false,
181
  "seed": 1000,
182
  "num_workers": 4,
183
  "batch_size": 8,
184
- "steps": 30000,
185
  "eval_freq": 20000,
186
  "log_freq": 200,
187
  "tolerance_s": 0.0001,
@@ -232,5 +239,5 @@
232
  "rabc_epsilon": 1e-06,
233
  "rabc_head_mode": "sparse",
234
  "rename_map": {},
235
- "checkpoint_path": null
236
  }
 
131
  "private": null,
132
  "tags": null,
133
  "license": null,
134
+ "pretrained_path": "outputs/pi05_training/checkpoints/last/pretrained_model",
135
  "paligemma_variant": "gemma_2b",
136
  "action_expert_variant": "gemma_300m",
137
  "dtype": "bfloat16",
 
146
  "time_sampling_offset": 0.001,
147
  "min_period": 0.004,
148
  "max_period": 4.0,
149
+ "rtc_config": {
150
+ "enabled": true,
151
+ "prefix_attention_schedule": "LINEAR",
152
+ "max_guidance_weight": 10.0,
153
+ "execution_horizon": 10,
154
+ "debug": false,
155
+ "debug_maxlen": 100
156
+ },
157
  "image_resolution": [
158
  224,
159
  224
 
170
  "compile_mode": "max-autotune",
171
  "freeze_vision_encoder": false,
172
  "train_expert_only": false,
173
+ "optimizer_lr": 5e-05,
174
  "optimizer_betas": [
175
  0.9,
176
  0.95
 
178
  "optimizer_eps": 1e-08,
179
  "optimizer_weight_decay": 0.01,
180
  "optimizer_grad_clip_norm": 1.0,
181
+ "scheduler_warmup_steps": 5000,
182
+ "scheduler_decay_steps": 25000,
183
+ "scheduler_decay_lr": 5e-05
184
  },
185
  "output_dir": "outputs/pi05_training",
186
  "job_name": "pi05_training",
187
+ "resume": true,
188
  "seed": 1000,
189
  "num_workers": 4,
190
  "batch_size": 8,
191
+ "steps": 300000,
192
  "eval_freq": 20000,
193
  "log_freq": 200,
194
  "tolerance_s": 0.0001,
 
239
  "rabc_epsilon": 1e-06,
240
  "rabc_head_mode": "sparse",
241
  "rename_map": {},
242
+ "checkpoint_path": "outputs/pi05_training/checkpoints/last"
243
  }