Robotics
LeRobot
Safetensors
smolvla
RonPlusSign committed on
Commit
4b3a508
·
verified ·
1 Parent(s): 68cf633

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. config.json +8 -8
  3. model.safetensors +2 -2
  4. train_config.json +15 -15
README.md CHANGED
@@ -1,14 +1,14 @@
1
  ---
2
  base_model: lerobot/smolvla_base
3
- datasets: RonPlusSign/RLBench-PutRubbishInBin-joint_positions
4
  library_name: lerobot
5
  license: apache-2.0
6
  model_name: smolvla
7
  pipeline_tag: robotics
8
  tags:
9
- - lerobot
10
- - smolvla
11
  - robotics
 
 
12
  ---
13
 
14
  # Model Card for smolvla
 
1
  ---
2
  base_model: lerobot/smolvla_base
3
+ datasets: RonPlusSign/RLBench-LeRobot-v3-PutRubbishInBin
4
  library_name: lerobot
5
  license: apache-2.0
6
  model_name: smolvla
7
  pipeline_tag: robotics
8
  tags:
 
 
9
  - robotics
10
+ - smolvla
11
+ - lerobot
12
  ---
13
 
14
  # Model Card for smolvla
config.json CHANGED
@@ -53,7 +53,7 @@
53
  "action": {
54
  "type": "ACTION",
55
  "shape": [
56
- 8
57
  ]
58
  }
59
  },
@@ -64,9 +64,9 @@
64
  "private": null,
65
  "tags": null,
66
  "license": null,
67
- "pretrained_path": "RonPlusSign/smolvla_base",
68
  "chunk_size": 50,
69
- "n_action_steps": 50,
70
  "normalization_mapping": {
71
  "VISUAL": "IDENTITY",
72
  "STATE": "MEAN_STD",
@@ -98,16 +98,16 @@
98
  "scheduler_warmup_steps": 1000,
99
  "scheduler_decay_steps": 30000,
100
  "scheduler_decay_lr": 2.5e-06,
101
- "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
102
  "load_vlm_weights": true,
103
  "add_image_special_tokens": false,
104
  "attention_mode": "cross_attn",
105
  "prefix_length": 0,
106
- "pad_language_to": "max_length",
107
- "num_expert_layers": 0,
108
- "num_vlm_layers": 16,
109
  "self_attn_every_n_layers": 2,
110
- "expert_width_multiplier": 0.75,
111
  "min_period": 0.004,
112
  "max_period": 4.0
113
  }
 
53
  "action": {
54
  "type": "ACTION",
55
  "shape": [
56
+ 7
57
  ]
58
  }
59
  },
 
64
  "private": null,
65
  "tags": null,
66
  "license": null,
67
+ "pretrained_path": "outputs/train/smolvla_finetuned_rubbish/checkpoints/last/pretrained_model",
68
  "chunk_size": 50,
69
+ "n_action_steps": 1,
70
  "normalization_mapping": {
71
  "VISUAL": "IDENTITY",
72
  "STATE": "MEAN_STD",
 
98
  "scheduler_warmup_steps": 1000,
99
  "scheduler_decay_steps": 30000,
100
  "scheduler_decay_lr": 2.5e-06,
101
+ "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Instruct",
102
  "load_vlm_weights": true,
103
  "add_image_special_tokens": false,
104
  "attention_mode": "cross_attn",
105
  "prefix_length": 0,
106
+ "pad_language_to": "longest",
107
+ "num_expert_layers": -1,
108
+ "num_vlm_layers": 0,
109
  "self_attn_every_n_layers": 2,
110
+ "expert_width_multiplier": 0.5,
111
  "min_period": 0.004,
112
  "max_period": 4.0
113
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3fcf2cfe93e6ee77831b0e6c8cb9a757be6caaefa67387db07f91ff62294f60
3
- size 906712520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1106fb447275318a9e1f3b013981a08414bd89f5ab55665c09d6cac79b9b5c62
3
+ size 1218047032
train_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "dataset": {
3
- "repo_id": "RonPlusSign/RLBench-PutRubbishInBin-joint_positions",
4
  "root": null,
5
  "episodes": null,
6
  "image_transforms": {
@@ -121,7 +121,7 @@
121
  "action": {
122
  "type": "ACTION",
123
  "shape": [
124
- 8
125
  ]
126
  }
127
  },
@@ -132,9 +132,9 @@
132
  "private": null,
133
  "tags": null,
134
  "license": null,
135
- "pretrained_path": "RonPlusSign/smolvla_base",
136
  "chunk_size": 50,
137
- "n_action_steps": 50,
138
  "normalization_mapping": {
139
  "VISUAL": "IDENTITY",
140
  "STATE": "MEAN_STD",
@@ -166,30 +166,30 @@
166
  "scheduler_warmup_steps": 1000,
167
  "scheduler_decay_steps": 30000,
168
  "scheduler_decay_lr": 2.5e-06,
169
- "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
170
  "load_vlm_weights": true,
171
  "add_image_special_tokens": false,
172
  "attention_mode": "cross_attn",
173
  "prefix_length": 0,
174
- "pad_language_to": "max_length",
175
- "num_expert_layers": 0,
176
- "num_vlm_layers": 16,
177
  "self_attn_every_n_layers": 2,
178
- "expert_width_multiplier": 0.75,
179
  "min_period": 0.004,
180
  "max_period": 4.0
181
  },
182
- "output_dir": "outputs/train/smolvla_finetuned_rubbish_joints",
183
  "job_name": "smolvla",
184
- "resume": false,
185
  "seed": 1000,
186
  "num_workers": 4,
187
- "batch_size": 64,
188
- "steps": 20000,
189
  "eval_freq": 20000,
190
  "log_freq": 200,
191
  "save_checkpoint": true,
192
- "save_freq": 20000,
193
  "use_policy_training_preset": true,
194
  "optimizer": {
195
  "type": "adamw",
@@ -220,7 +220,7 @@
220
  "project": "lerobot",
221
  "entity": null,
222
  "notes": null,
223
- "run_id": "o3rqxmof",
224
  "mode": null
225
  }
226
  }
 
1
  {
2
  "dataset": {
3
+ "repo_id": "RonPlusSign/RLBench-LeRobot-v3-PutRubbishInBin",
4
  "root": null,
5
  "episodes": null,
6
  "image_transforms": {
 
121
  "action": {
122
  "type": "ACTION",
123
  "shape": [
124
+ 7
125
  ]
126
  }
127
  },
 
132
  "private": null,
133
  "tags": null,
134
  "license": null,
135
+ "pretrained_path": "outputs/train/smolvla_finetuned_rubbish/checkpoints/last/pretrained_model",
136
  "chunk_size": 50,
137
+ "n_action_steps": 1,
138
  "normalization_mapping": {
139
  "VISUAL": "IDENTITY",
140
  "STATE": "MEAN_STD",
 
166
  "scheduler_warmup_steps": 1000,
167
  "scheduler_decay_steps": 30000,
168
  "scheduler_decay_lr": 2.5e-06,
169
+ "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Instruct",
170
  "load_vlm_weights": true,
171
  "add_image_special_tokens": false,
172
  "attention_mode": "cross_attn",
173
  "prefix_length": 0,
174
+ "pad_language_to": "longest",
175
+ "num_expert_layers": -1,
176
+ "num_vlm_layers": 0,
177
  "self_attn_every_n_layers": 2,
178
+ "expert_width_multiplier": 0.5,
179
  "min_period": 0.004,
180
  "max_period": 4.0
181
  },
182
+ "output_dir": "outputs/train/smolvla_finetuned_rubbish",
183
  "job_name": "smolvla",
184
+ "resume": true,
185
  "seed": 1000,
186
  "num_workers": 4,
187
+ "batch_size": 32,
188
+ "steps": 60000,
189
  "eval_freq": 20000,
190
  "log_freq": 200,
191
  "save_checkpoint": true,
192
+ "save_freq": 10000,
193
  "use_policy_training_preset": true,
194
  "optimizer": {
195
  "type": "adamw",
 
220
  "project": "lerobot",
221
  "entity": null,
222
  "notes": null,
223
+ "run_id": "gwlgotby",
224
  "mode": null
225
  }
226
  }