Robotics
LeRobot
Safetensors
smolvla
JinghuiLuAstronaut commited on
Commit
c91936c
·
verified ·
1 Parent(s): 0564a01

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. config.json +5 -5
  3. model.safetensors +2 -2
  4. train_config.json +13 -13
README.md CHANGED
@@ -7,8 +7,8 @@ model_name: smolvla
7
  pipeline_tag: robotics
8
  tags:
9
  - lerobot
10
- - smolvla
11
  - robotics
 
12
  ---
13
 
14
  # Model Card for smolvla
 
7
  pipeline_tag: robotics
8
  tags:
9
  - lerobot
 
10
  - robotics
11
+ - smolvla
12
  ---
13
 
14
  # Model Card for smolvla
config.json CHANGED
@@ -69,17 +69,17 @@
69
  ],
70
  "optimizer_eps": 1e-08,
71
  "optimizer_weight_decay": 1e-10,
72
- "optimizer_grad_clip_norm": 10,
73
  "scheduler_warmup_steps": 1000,
74
  "scheduler_decay_steps": 30000,
75
  "scheduler_decay_lr": 2.5e-06,
76
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
77
- "load_vlm_weights": false,
78
  "add_image_special_tokens": false,
79
  "attention_mode": "cross_attn",
80
- "prefix_length": -1,
81
- "pad_language_to": "longest",
82
- "num_expert_layers": -1,
83
  "num_vlm_layers": 16,
84
  "self_attn_every_n_layers": 2,
85
  "expert_width_multiplier": 0.75,
 
69
  ],
70
  "optimizer_eps": 1e-08,
71
  "optimizer_weight_decay": 1e-10,
72
+ "optimizer_grad_clip_norm": 10.0,
73
  "scheduler_warmup_steps": 1000,
74
  "scheduler_decay_steps": 30000,
75
  "scheduler_decay_lr": 2.5e-06,
76
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
77
+ "load_vlm_weights": true,
78
  "add_image_special_tokens": false,
79
  "attention_mode": "cross_attn",
80
+ "prefix_length": 0,
81
+ "pad_language_to": "max_length",
82
+ "num_expert_layers": 0,
83
  "num_vlm_layers": 16,
84
  "self_attn_every_n_layers": 2,
85
  "expert_width_multiplier": 0.75,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dca556518ae84d1bc5c2a621f32cc7f5b1dfab165f4db0eaacb46f593911f9b5
3
- size 1197790048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00e108ddc7be5e3c46222bad6372af6151e4dccdf435ef4ad71ba9639332e698
3
+ size 906713328
train_config.json CHANGED
@@ -136,17 +136,17 @@
136
  ],
137
  "optimizer_eps": 1e-08,
138
  "optimizer_weight_decay": 1e-10,
139
- "optimizer_grad_clip_norm": 10,
140
  "scheduler_warmup_steps": 1000,
141
  "scheduler_decay_steps": 30000,
142
  "scheduler_decay_lr": 2.5e-06,
143
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
144
- "load_vlm_weights": false,
145
  "add_image_special_tokens": false,
146
  "attention_mode": "cross_attn",
147
- "prefix_length": -1,
148
- "pad_language_to": "longest",
149
- "num_expert_layers": -1,
150
  "num_vlm_layers": 16,
151
  "self_attn_every_n_layers": 2,
152
  "expert_width_multiplier": 0.75,
@@ -154,22 +154,22 @@
154
  "max_period": 4.0
155
  },
156
  "output_dir": "outputs/train/smolvla-spatial",
157
- "job_name": "smolvla_so101",
158
  "resume": false,
159
  "seed": 1000,
160
  "num_workers": 4,
161
  "batch_size": 64,
162
- "steps": 200000,
163
  "eval_freq": 20000,
164
- "log_freq": 200,
165
  "save_checkpoint": true,
166
- "save_freq": 20000,
167
  "use_policy_training_preset": true,
168
  "optimizer": {
169
  "type": "adamw",
170
  "lr": 0.0001,
171
  "weight_decay": 1e-10,
172
- "grad_clip_norm": 10,
173
  "betas": [
174
  0.9,
175
  0.95
@@ -189,12 +189,12 @@
189
  "use_async_envs": false
190
  },
191
  "wandb": {
192
- "enable": false,
193
  "disable_artifact": false,
194
- "project": "lerobot",
195
  "entity": null,
196
  "notes": null,
197
- "run_id": null,
198
  "mode": null
199
  }
200
  }
 
136
  ],
137
  "optimizer_eps": 1e-08,
138
  "optimizer_weight_decay": 1e-10,
139
+ "optimizer_grad_clip_norm": 10.0,
140
  "scheduler_warmup_steps": 1000,
141
  "scheduler_decay_steps": 30000,
142
  "scheduler_decay_lr": 2.5e-06,
143
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
144
+ "load_vlm_weights": true,
145
  "add_image_special_tokens": false,
146
  "attention_mode": "cross_attn",
147
+ "prefix_length": 0,
148
+ "pad_language_to": "max_length",
149
+ "num_expert_layers": 0,
150
  "num_vlm_layers": 16,
151
  "self_attn_every_n_layers": 2,
152
  "expert_width_multiplier": 0.75,
 
154
  "max_period": 4.0
155
  },
156
  "output_dir": "outputs/train/smolvla-spatial",
157
+ "job_name": "smolvla_libero_spatial",
158
  "resume": false,
159
  "seed": 1000,
160
  "num_workers": 4,
161
  "batch_size": 64,
162
+ "steps": 100000,
163
  "eval_freq": 20000,
164
+ "log_freq": 1,
165
  "save_checkpoint": true,
166
+ "save_freq": 2000,
167
  "use_policy_training_preset": true,
168
  "optimizer": {
169
  "type": "adamw",
170
  "lr": 0.0001,
171
  "weight_decay": 1e-10,
172
+ "grad_clip_norm": 10.0,
173
  "betas": [
174
  0.9,
175
  0.95
 
189
  "use_async_envs": false
190
  },
191
  "wandb": {
192
+ "enable": true,
193
  "disable_artifact": false,
194
+ "project": "lerobot_ljh",
195
  "entity": null,
196
  "notes": null,
197
+ "run_id": "run_20250818_b689510d",
198
  "mode": null
199
  }
200
  }