Robotics
LeRobot
Safetensors
smolvla
ethanCSL committed on
Commit
7b8bcb6
·
verified ·
1 Parent(s): b2663de

Upload policy weights, train config and readme

Browse files
Files changed (4) hide show
  1. README.md +1 -1
  2. config.json +2 -2
  3. model.safetensors +1 -1
  4. train_config.json +2 -2
README.md CHANGED
@@ -6,8 +6,8 @@ license: apache-2.0
6
  model_name: smolvla
7
  pipeline_tag: robotics
8
  tags:
9
- - robotics
10
  - smolvla
 
11
  - lerobot
12
  ---
13
 
 
6
  model_name: smolvla
7
  pipeline_tag: robotics
8
  tags:
 
9
  - smolvla
10
+ - robotics
11
  - lerobot
12
  ---
13
 
config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "type": "smolvla",
3
- "n_obs_steps": 1,
4
  "normalization_mapping": {
5
  "VISUAL": "IDENTITY",
6
  "STATE": "MEAN_STD",
@@ -75,7 +75,7 @@
75
  "scheduler_decay_lr": 2.5e-06,
76
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
77
  "load_vlm_weights": true,
78
- "add_image_special_tokens": false,
79
  "attention_mode": "cross_attn",
80
  "prefix_length": 0,
81
  "pad_language_to": "max_length",
 
1
  {
2
  "type": "smolvla",
3
+ "n_obs_steps": 2,
4
  "normalization_mapping": {
5
  "VISUAL": "IDENTITY",
6
  "STATE": "MEAN_STD",
 
75
  "scheduler_decay_lr": 2.5e-06,
76
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
77
  "load_vlm_weights": true,
78
+ "add_image_special_tokens": true,
79
  "attention_mode": "cross_attn",
80
  "prefix_length": 0,
81
  "pad_language_to": "max_length",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f7a028858fda986532adb9ab47240d59f540dcb5e014c2c7b0df7b735dc81ff
3
  size 906713296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d21ec3e915b40cef0eaadca1a3bc4a1a6b90b25b7f4d0101e9685c066bf6416
3
  size 906713296
train_config.json CHANGED
@@ -67,7 +67,7 @@
67
  "env": null,
68
  "policy": {
69
  "type": "smolvla",
70
- "n_obs_steps": 1,
71
  "normalization_mapping": {
72
  "VISUAL": "IDENTITY",
73
  "STATE": "MEAN_STD",
@@ -142,7 +142,7 @@
142
  "scheduler_decay_lr": 2.5e-06,
143
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
144
  "load_vlm_weights": true,
145
- "add_image_special_tokens": false,
146
  "attention_mode": "cross_attn",
147
  "prefix_length": 0,
148
  "pad_language_to": "max_length",
 
67
  "env": null,
68
  "policy": {
69
  "type": "smolvla",
70
+ "n_obs_steps": 2,
71
  "normalization_mapping": {
72
  "VISUAL": "IDENTITY",
73
  "STATE": "MEAN_STD",
 
142
  "scheduler_decay_lr": 2.5e-06,
143
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
144
  "load_vlm_weights": true,
145
+ "add_image_special_tokens": true,
146
  "attention_mode": "cross_attn",
147
  "prefix_length": 0,
148
  "pad_language_to": "max_length",