Orellius committed on
Commit
411ca71
·
verified ·
1 Parent(s): 38674bc

Upload model checkpoint from pretrained_model

Browse files
Files changed (3) hide show
  1. config.json +5 -5
  2. model.safetensors +1 -1
  3. train_config.json +17 -17
config.json CHANGED
@@ -33,7 +33,7 @@
33
  "private": null,
34
  "tags": null,
35
  "license": null,
36
- "pretrained_path": "outputs/train/so101_sort_so101_sort_smolvla_20251107_2019/checkpoints/last/pretrained_model",
37
  "chunk_size": 50,
38
  "n_action_steps": 50,
39
  "normalization_mapping": {
@@ -56,16 +56,16 @@
56
  "freeze_vision_encoder": true,
57
  "train_expert_only": true,
58
  "train_state_proj": true,
59
- "optimizer_lr": 0.0003,
60
  "optimizer_betas": [
61
  0.9,
62
  0.95
63
  ],
64
  "optimizer_eps": 1e-08,
65
  "optimizer_weight_decay": 1e-10,
66
- "optimizer_grad_clip_norm": 10.0,
67
- "scheduler_warmup_steps": 350,
68
- "scheduler_decay_steps": 7000,
69
  "scheduler_decay_lr": 2.5e-06,
70
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
71
  "load_vlm_weights": false,
 
33
  "private": null,
34
  "tags": null,
35
  "license": null,
36
+ "pretrained_path": null,
37
  "chunk_size": 50,
38
  "n_action_steps": 50,
39
  "normalization_mapping": {
 
56
  "freeze_vision_encoder": true,
57
  "train_expert_only": true,
58
  "train_state_proj": true,
59
+ "optimizer_lr": 0.0001,
60
  "optimizer_betas": [
61
  0.9,
62
  0.95
63
  ],
64
  "optimizer_eps": 1e-08,
65
  "optimizer_weight_decay": 1e-10,
66
+ "optimizer_grad_clip_norm": 10,
67
+ "scheduler_warmup_steps": 10000,
68
+ "scheduler_decay_steps": 200000,
69
  "scheduler_decay_lr": 2.5e-06,
70
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
71
  "load_vlm_weights": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6265a9d5b6b0b093f931192c8a92657d6aeabd8425f0081922d71b6fce508d72
3
  size 1197789224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef6debe8b189c220f6251cc5bf14390893588620adb0dabd1dd82a3ab8e272b6
3
  size 1197789224
train_config.json CHANGED
@@ -101,7 +101,7 @@
101
  "private": null,
102
  "tags": null,
103
  "license": null,
104
- "pretrained_path": "outputs/train/so101_sort_so101_sort_smolvla_20251107_2019/checkpoints/last/pretrained_model",
105
  "chunk_size": 50,
106
  "n_action_steps": 50,
107
  "normalization_mapping": {
@@ -124,16 +124,16 @@
124
  "freeze_vision_encoder": true,
125
  "train_expert_only": true,
126
  "train_state_proj": true,
127
- "optimizer_lr": 0.0003,
128
  "optimizer_betas": [
129
  0.9,
130
  0.95
131
  ],
132
  "optimizer_eps": 1e-08,
133
  "optimizer_weight_decay": 1e-10,
134
- "optimizer_grad_clip_norm": 10.0,
135
- "scheduler_warmup_steps": 350,
136
- "scheduler_decay_steps": 7000,
137
  "scheduler_decay_lr": 2.5e-06,
138
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
139
  "load_vlm_weights": false,
@@ -148,13 +148,13 @@
148
  "min_period": 0.004,
149
  "max_period": 4.0
150
  },
151
- "output_dir": "outputs/train/so101_sort_so101_sort_smolvla_20251107_2019",
152
- "job_name": "so101_sort_so101_sort_smolvla_20251107_2019",
153
- "resume": true,
154
  "seed": 1000,
155
  "num_workers": 4,
156
- "batch_size": 4,
157
- "steps": 7000,
158
  "eval_freq": 200,
159
  "log_freq": 100,
160
  "save_checkpoint": true,
@@ -162,9 +162,9 @@
162
  "use_policy_training_preset": true,
163
  "optimizer": {
164
  "type": "adamw",
165
- "lr": 0.0003,
166
  "weight_decay": 1e-10,
167
- "grad_clip_norm": 10.0,
168
  "betas": [
169
  0.9,
170
  0.95
@@ -173,9 +173,9 @@
173
  },
174
  "scheduler": {
175
  "type": "cosine_decay_with_warmup",
176
- "num_warmup_steps": 250,
177
- "num_decay_steps": 5000,
178
- "peak_lr": 0.0003,
179
  "decay_lr": 2.5e-06
180
  },
181
  "eval": {
@@ -184,12 +184,12 @@
184
  "use_async_envs": false
185
  },
186
  "wandb": {
187
- "enable": false,
188
  "disable_artifact": false,
189
  "project": "lerobot-shabby",
190
  "entity": null,
191
  "notes": null,
192
- "run_id": null,
193
  "mode": null
194
  },
195
  "peft": null
 
101
  "private": null,
102
  "tags": null,
103
  "license": null,
104
+ "pretrained_path": null,
105
  "chunk_size": 50,
106
  "n_action_steps": 50,
107
  "normalization_mapping": {
 
124
  "freeze_vision_encoder": true,
125
  "train_expert_only": true,
126
  "train_state_proj": true,
127
+ "optimizer_lr": 0.0001,
128
  "optimizer_betas": [
129
  0.9,
130
  0.95
131
  ],
132
  "optimizer_eps": 1e-08,
133
  "optimizer_weight_decay": 1e-10,
134
+ "optimizer_grad_clip_norm": 10,
135
+ "scheduler_warmup_steps": 10000,
136
+ "scheduler_decay_steps": 200000,
137
  "scheduler_decay_lr": 2.5e-06,
138
  "vlm_model_name": "HuggingFaceTB/SmolVLM2-500M-Video-Instruct",
139
  "load_vlm_weights": false,
 
148
  "min_period": 0.004,
149
  "max_period": 4.0
150
  },
151
+ "output_dir": "outputs/train/so101_sort_so101_sort_smolvla_20251110_0139",
152
+ "job_name": "so101_sort_so101_sort_smolvla_20251110_0139",
153
+ "resume": false,
154
  "seed": 1000,
155
  "num_workers": 4,
156
+ "batch_size": 64,
157
+ "steps": 200000,
158
  "eval_freq": 200,
159
  "log_freq": 100,
160
  "save_checkpoint": true,
 
162
  "use_policy_training_preset": true,
163
  "optimizer": {
164
  "type": "adamw",
165
+ "lr": 0.0001,
166
  "weight_decay": 1e-10,
167
+ "grad_clip_norm": 10,
168
  "betas": [
169
  0.9,
170
  0.95
 
173
  },
174
  "scheduler": {
175
  "type": "cosine_decay_with_warmup",
176
+ "num_warmup_steps": 10000,
177
+ "num_decay_steps": 200000,
178
+ "peak_lr": 0.0001,
179
  "decay_lr": 2.5e-06
180
  },
181
  "eval": {
 
184
  "use_async_envs": false
185
  },
186
  "wandb": {
187
+ "enable": true,
188
  "disable_artifact": false,
189
  "project": "lerobot-shabby",
190
  "entity": null,
191
  "notes": null,
192
+ "run_id": "dzsh8gnl",
193
  "mode": null
194
  },
195
  "peft": null