Instructions to use dnn1002/smolvla_base with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- LeRobot
How to use dnn1002/smolvla_base with LeRobot:
# See https://github.com/huggingface/lerobot?tab=readme-ov-file#installation for more details git clone https://github.com/huggingface/lerobot.git cd lerobot pip install -e .[smolvla]
# Launch finetuning on your dataset python lerobot/scripts/train.py \ --policy.path=dnn1002/smolvla_base \ --dataset.repo_id=lerobot/svla_so101_pickplace \ --batch_size=64 \ --steps=20000 \ --output_dir=outputs/train/my_smolvla \ --job_name=my_smolvla_training \ --policy.device=cuda \ --wandb.enable=true
# Run the policy using the record function python -m lerobot.record \ --robot.type=so101_follower \ --robot.port=/dev/ttyACM0 \ # <- Use your port --robot.id=my_blue_follower_arm \ # <- Use your robot id --robot.cameras="{ front: {type: opencv, index_or_path: 8, width: 640, height: 480, fps: 30}}" \ # <- Use your cameras --dataset.single_task="Grasp a lego block and put it in the bin." \ # <- Use the same task description you used in your dataset recording --dataset.repo_id=HF_USER/dataset_name \ # <- This will be the dataset name on HF Hub --dataset.episode_time_s=50 \ --dataset.num_episodes=10 \ --policy.path=dnn1002/smolvla_base - Notebooks
- Google Colab
- Kaggle
Upload policy weights, train config and readme
Browse files- README.md +1 -1
- config.json +1 -1
- model.safetensors +1 -1
- train_config.json +5 -5
README.md
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
---
|
| 2 |
base_model: lerobot/smolvla_base
|
| 3 |
-
datasets: dnn1002/so101-simple-
|
| 4 |
library_name: lerobot
|
| 5 |
license: apache-2.0
|
| 6 |
model_name: smolvla
|
|
|
|
| 1 |
---
|
| 2 |
base_model: lerobot/smolvla_base
|
| 3 |
+
datasets: dnn1002/so101-simple-pickup-2-cameras
|
| 4 |
library_name: lerobot
|
| 5 |
license: apache-2.0
|
| 6 |
model_name: smolvla
|
config.json
CHANGED
|
@@ -49,7 +49,7 @@
|
|
| 49 |
"private": null,
|
| 50 |
"tags": null,
|
| 51 |
"license": null,
|
| 52 |
-
"pretrained_path": "outputs/train/smolvla/checkpoints/
|
| 53 |
"chunk_size": 50,
|
| 54 |
"n_action_steps": 50,
|
| 55 |
"normalization_mapping": {
|
|
|
|
| 49 |
"private": null,
|
| 50 |
"tags": null,
|
| 51 |
"license": null,
|
| 52 |
+
"pretrained_path": "outputs/train/smolvla/checkpoints/last/pretrained_model",
|
| 53 |
"chunk_size": 50,
|
| 54 |
"n_action_steps": 50,
|
| 55 |
"normalization_mapping": {
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 906712520
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45e009a95f14e3bec242c23513a628d9189afc484943feff57bc0e811d8b6c2b
|
| 3 |
size 906712520
|
train_config.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"dataset": {
|
| 3 |
-
"repo_id": "dnn1002/so101-simple-
|
| 4 |
"root": null,
|
| 5 |
"episodes": null,
|
| 6 |
"image_transforms": {
|
|
@@ -131,7 +131,7 @@
|
|
| 131 |
"private": null,
|
| 132 |
"tags": null,
|
| 133 |
"license": null,
|
| 134 |
-
"pretrained_path": "outputs/train/smolvla/checkpoints/
|
| 135 |
"chunk_size": 50,
|
| 136 |
"n_action_steps": 50,
|
| 137 |
"normalization_mapping": {
|
|
@@ -187,8 +187,8 @@
|
|
| 187 |
"seed": 1000,
|
| 188 |
"cudnn_deterministic": false,
|
| 189 |
"num_workers": 4,
|
| 190 |
-
"batch_size":
|
| 191 |
-
"steps":
|
| 192 |
"eval_freq": 20000,
|
| 193 |
"log_freq": 200,
|
| 194 |
"tolerance_s": 0.0001,
|
|
@@ -238,5 +238,5 @@
|
|
| 238 |
"observation.images.gripper": "observation.images.camera1",
|
| 239 |
"observation.images.top": "observation.images.camera2"
|
| 240 |
},
|
| 241 |
-
"checkpoint_path": "outputs/train/smolvla/checkpoints/
|
| 242 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"dataset": {
|
| 3 |
+
"repo_id": "dnn1002/so101-simple-pickup-2-cameras",
|
| 4 |
"root": null,
|
| 5 |
"episodes": null,
|
| 6 |
"image_transforms": {
|
|
|
|
| 131 |
"private": null,
|
| 132 |
"tags": null,
|
| 133 |
"license": null,
|
| 134 |
+
"pretrained_path": "outputs/train/smolvla/checkpoints/last/pretrained_model",
|
| 135 |
"chunk_size": 50,
|
| 136 |
"n_action_steps": 50,
|
| 137 |
"normalization_mapping": {
|
|
|
|
| 187 |
"seed": 1000,
|
| 188 |
"cudnn_deterministic": false,
|
| 189 |
"num_workers": 4,
|
| 190 |
+
"batch_size": 16,
|
| 191 |
+
"steps": 50000,
|
| 192 |
"eval_freq": 20000,
|
| 193 |
"log_freq": 200,
|
| 194 |
"tolerance_s": 0.0001,
|
|
|
|
| 238 |
"observation.images.gripper": "observation.images.camera1",
|
| 239 |
"observation.images.top": "observation.images.camera2"
|
| 240 |
},
|
| 241 |
+
"checkpoint_path": "outputs/train/smolvla/checkpoints/last"
|
| 242 |
}
|