alexhegit committed on
Commit
9f55434
·
verified ·
1 Parent(s): ebee6cd

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +2 -2
  2. config.json +5 -5
  3. model.safetensors +2 -2
  4. train_config.json +17 -17
README.md CHANGED
@@ -1,13 +1,13 @@
1
  ---
2
- datasets: alexhegit/starai_lab1
3
  library_name: lerobot
4
  license: apache-2.0
5
  model_name: pi0
6
  pipeline_tag: robotics
7
  tags:
8
- - robotics
9
  - lerobot
10
  - pi0
 
11
  ---
12
 
13
  # Model Card for pi0
 
1
  ---
2
+ datasets: alexhegit/so101_lab1
3
  library_name: lerobot
4
  license: apache-2.0
5
  model_name: pi0
6
  pipeline_tag: robotics
7
  tags:
 
8
  - lerobot
9
  - pi0
10
+ - robotics
11
  ---
12
 
13
  # Model Card for pi0
config.json CHANGED
@@ -5,7 +5,7 @@
5
  "observation.state": {
6
  "type": "STATE",
7
  "shape": [
8
- 7
9
  ]
10
  },
11
  "observation.images.top": {
@@ -29,7 +29,7 @@
29
  "action": {
30
  "type": "ACTION",
31
  "shape": [
32
- 7
33
  ]
34
  }
35
  },
@@ -40,10 +40,10 @@
40
  "private": null,
41
  "tags": null,
42
  "license": null,
43
- "pretrained_path": "outputs/train/pi0_starai_lab1/checkpoints/last/pretrained_model",
44
  "paligemma_variant": "gemma_2b",
45
  "action_expert_variant": "gemma_300m",
46
- "dtype": "float32",
47
  "chunk_size": 50,
48
  "n_action_steps": 50,
49
  "max_state_dim": 32,
@@ -68,7 +68,7 @@
68
  "gradient_checkpointing": false,
69
  "compile_model": false,
70
  "compile_mode": "max-autotune",
71
- "optimizer_lr": 1e-05,
72
  "optimizer_betas": [
73
  0.9,
74
  0.95
 
5
  "observation.state": {
6
  "type": "STATE",
7
  "shape": [
8
+ 6
9
  ]
10
  },
11
  "observation.images.top": {
 
29
  "action": {
30
  "type": "ACTION",
31
  "shape": [
32
+ 6
33
  ]
34
  }
35
  },
 
40
  "private": null,
41
  "tags": null,
42
  "license": null,
43
+ "pretrained_path": "lerobot/pi0_base",
44
  "paligemma_variant": "gemma_2b",
45
  "action_expert_variant": "gemma_300m",
46
+ "dtype": "bfloat16",
47
  "chunk_size": 50,
48
  "n_action_steps": 50,
49
  "max_state_dim": 32,
 
68
  "gradient_checkpointing": false,
69
  "compile_model": false,
70
  "compile_mode": "max-autotune",
71
+ "optimizer_lr": 2.5e-05,
72
  "optimizer_betas": [
73
  0.9,
74
  0.95
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6918d5c9ed64247673e84bb570624b83d859a9e5f034a49ba13d91298206f27e
3
- size 14005623256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae7efd956c041810a03b862713d5fcf38260936eeb4ff524b358861d8c7d744e
3
+ size 7011548640
train_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "dataset": {
3
- "repo_id": "alexhegit/starai_lab1",
4
- "root": "/ws/dataset/starai_dataset/",
5
  "episodes": null,
6
  "image_transforms": {
7
  "enable": false,
@@ -87,7 +87,7 @@
87
  "observation.state": {
88
  "type": "STATE",
89
  "shape": [
90
- 7
91
  ]
92
  },
93
  "observation.images.top": {
@@ -111,7 +111,7 @@
111
  "action": {
112
  "type": "ACTION",
113
  "shape": [
114
- 7
115
  ]
116
  }
117
  },
@@ -122,10 +122,10 @@
122
  "private": null,
123
  "tags": null,
124
  "license": null,
125
- "pretrained_path": "outputs/train/pi0_starai_lab1/checkpoints/last/pretrained_model",
126
  "paligemma_variant": "gemma_2b",
127
  "action_expert_variant": "gemma_300m",
128
- "dtype": "float32",
129
  "chunk_size": 50,
130
  "n_action_steps": 50,
131
  "max_state_dim": 32,
@@ -150,7 +150,7 @@
150
  "gradient_checkpointing": false,
151
  "compile_model": false,
152
  "compile_mode": "max-autotune",
153
- "optimizer_lr": 1e-05,
154
  "optimizer_betas": [
155
  0.9,
156
  0.95
@@ -163,21 +163,21 @@
163
  "scheduler_decay_lr": 2.5e-06,
164
  "tokenizer_max_length": 48
165
  },
166
- "output_dir": "/ws/dataset/outputs/train/pi0_starai_lab1",
167
- "job_name": "pi0_starai_lab1",
168
- "resume": true,
169
  "seed": 1000,
170
  "num_workers": 4,
171
- "batch_size": 16,
172
  "steps": 20000,
173
  "eval_freq": 20000,
174
  "log_freq": 100,
175
  "save_checkpoint": true,
176
- "save_freq": 5000,
177
  "use_policy_training_preset": true,
178
  "optimizer": {
179
  "type": "adamw",
180
- "lr": 1e-05,
181
  "weight_decay": 0.01,
182
  "grad_clip_norm": 1.0,
183
  "betas": [
@@ -190,7 +190,7 @@
190
  "type": "cosine_decay_with_warmup",
191
  "num_warmup_steps": 1000,
192
  "num_decay_steps": 30000,
193
- "peak_lr": 1e-05,
194
  "decay_lr": 2.5e-06
195
  },
196
  "eval": {
@@ -201,12 +201,12 @@
201
  "wandb": {
202
  "enable": true,
203
  "disable_artifact": true,
204
- "project": "pi0_starai_lab1-1110",
205
  "entity": null,
206
  "notes": null,
207
- "run_id": "9r007sbe",
208
  "mode": null
209
  },
210
- "checkpoint_path": "outputs/train/pi0_starai_lab1/checkpoints/last",
211
  "rename_map": {}
212
  }
 
1
  {
2
  "dataset": {
3
+ "repo_id": "alexhegit/so101_lab1",
4
+ "root": "/ws/so101-train/so101_dataset/",
5
  "episodes": null,
6
  "image_transforms": {
7
  "enable": false,
 
87
  "observation.state": {
88
  "type": "STATE",
89
  "shape": [
90
+ 6
91
  ]
92
  },
93
  "observation.images.top": {
 
111
  "action": {
112
  "type": "ACTION",
113
  "shape": [
114
+ 6
115
  ]
116
  }
117
  },
 
122
  "private": null,
123
  "tags": null,
124
  "license": null,
125
+ "pretrained_path": "lerobot/pi0_base",
126
  "paligemma_variant": "gemma_2b",
127
  "action_expert_variant": "gemma_300m",
128
+ "dtype": "bfloat16",
129
  "chunk_size": 50,
130
  "n_action_steps": 50,
131
  "max_state_dim": 32,
 
150
  "gradient_checkpointing": false,
151
  "compile_model": false,
152
  "compile_mode": "max-autotune",
153
+ "optimizer_lr": 2.5e-05,
154
  "optimizer_betas": [
155
  0.9,
156
  0.95
 
163
  "scheduler_decay_lr": 2.5e-06,
164
  "tokenizer_max_length": 48
165
  },
166
+ "output_dir": "/ws/so101-train/outputs/train/pi0_so101_lab1",
167
+ "job_name": "pi0_so101_lab1",
168
+ "resume": false,
169
  "seed": 1000,
170
  "num_workers": 4,
171
+ "batch_size": 32,
172
  "steps": 20000,
173
  "eval_freq": 20000,
174
  "log_freq": 100,
175
  "save_checkpoint": true,
176
+ "save_freq": 10000,
177
  "use_policy_training_preset": true,
178
  "optimizer": {
179
  "type": "adamw",
180
+ "lr": 2.5e-05,
181
  "weight_decay": 0.01,
182
  "grad_clip_norm": 1.0,
183
  "betas": [
 
190
  "type": "cosine_decay_with_warmup",
191
  "num_warmup_steps": 1000,
192
  "num_decay_steps": 30000,
193
+ "peak_lr": 2.5e-05,
194
  "decay_lr": 2.5e-06
195
  },
196
  "eval": {
 
201
  "wandb": {
202
  "enable": true,
203
  "disable_artifact": true,
204
+ "project": "pi0_so101_lab1-1118",
205
  "entity": null,
206
  "notes": null,
207
+ "run_id": "izior0oc",
208
  "mode": null
209
  },
210
+ "checkpoint_path": null,
211
  "rename_map": {}
212
  }