Robotics · LeRobot · Safetensors · act

SonDePoisson committed · Commit d6eec22 · verified · 1 parent: 7bfd39c

Upload policy weights, train config and readme

Files changed (4)
  1. README.md +5 -8
  2. config.json +69 -0
  3. model.safetensors +3 -0
  4. train_config.json +175 -0
README.md CHANGED
@@ -1,24 +1,21 @@
 ---
-datasets:
-- SonDePoisson/so101_test_dataset
+datasets: SonDePoisson/so101_test_dataset
 library_name: lerobot
 license: apache-2.0
-model_name: reward_classifier
+model_name: act
 pipeline_tag: robotics
 tags:
+- act
 - lerobot
-- reward_classifier
 - robotics
-base_model:
-- lerobot/smolvla_base
 ---

-# Model Card for reward_classifier
+# Model Card for act

 <!-- Provide a quick summary of what the model is/does. -->


-A reward classifier is a lightweight neural network that scores observations or trajectories for task success, providing a learned reward signal or offline evaluation when explicit rewards are unavailable.
+[Action Chunking with Transformers (ACT)](https://huggingface.co/papers/2304.13705) is an imitation-learning method that predicts short action chunks instead of single steps. It learns from teleoperated data and often achieves high success rates.


 This policy has been trained and pushed to the Hub using [LeRobot](https://github.com/huggingface/lerobot).
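
The uploaded weights load directly from the Hub. A minimal loading sketch, assuming a recent lerobot release (older releases expose the same class under `lerobot.common.policies.act.modeling_act`):

```python
# Minimal loading sketch -- the import path is assumed for a recent lerobot
# release; older releases use lerobot.common.policies.act.modeling_act.
from lerobot.policies.act.modeling_act import ACTPolicy

policy = ACTPolicy.from_pretrained("SonDePoisson/so101_test_model")
policy.eval()
print(policy.config.chunk_size)  # 100, per config.json below
```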
config.json ADDED
@@ -0,0 +1,69 @@
+{
+    "type": "act",
+    "n_obs_steps": 1,
+    "normalization_mapping": {
+        "VISUAL": "MEAN_STD",
+        "STATE": "MEAN_STD",
+        "ACTION": "MEAN_STD"
+    },
+    "input_features": {
+        "observation.state": {
+            "type": "STATE",
+            "shape": [
+                21
+            ]
+        },
+        "observation.images.side": {
+            "type": "VISUAL",
+            "shape": [
+                3,
+                256,
+                256
+            ]
+        },
+        "observation.images.top": {
+            "type": "VISUAL",
+            "shape": [
+                3,
+                256,
+                256
+            ]
+        }
+    },
+    "output_features": {
+        "action": {
+            "type": "ACTION",
+            "shape": [
+                4
+            ]
+        }
+    },
+    "device": "mps",
+    "use_amp": false,
+    "push_to_hub": true,
+    "repo_id": "SonDePoisson/so101_test_model",
+    "private": null,
+    "tags": null,
+    "license": null,
+    "chunk_size": 100,
+    "n_action_steps": 100,
+    "vision_backbone": "resnet18",
+    "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
+    "replace_final_stride_with_dilation": false,
+    "pre_norm": false,
+    "dim_model": 512,
+    "n_heads": 8,
+    "dim_feedforward": 3200,
+    "feedforward_activation": "relu",
+    "n_encoder_layers": 4,
+    "n_decoder_layers": 1,
+    "use_vae": true,
+    "latent_dim": 32,
+    "n_vae_encoder_layers": 4,
+    "temporal_ensemble_coeff": null,
+    "dropout": 0.1,
+    "kl_weight": 10.0,
+    "optimizer_lr": 1e-05,
+    "optimizer_weight_decay": 0.0001,
+    "optimizer_lr_backbone": 1e-05
+}
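
With `chunk_size` and `n_action_steps` both at 100 and `temporal_ensemble_coeff` left null, the policy predicts a 100-step action chunk, serves it one action at a time from an internal queue, and replans only when the queue runs dry. A rough control-loop sketch, continuing from the loading sketch above; `get_observation` and `send_to_robot` are hypothetical placeholders for the robot I/O:

```python
import torch

policy.reset()  # clear the action queue at the start of an episode
for _ in range(1000):
    # get_observation() is a placeholder returning a dict shaped like
    # input_features above: "observation.state" as a (1, 21) tensor and
    # two (1, 3, 256, 256) camera tensors, on the policy's device.
    obs = get_observation()
    with torch.inference_mode():
        # Returns one (1, 4) action; a fresh chunk is predicted only
        # once every 100 calls, per n_action_steps.
        action = policy.select_action(obs)
    send_to_robot(action)  # placeholder actuation call
```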
model.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61ad9b11299ec080a64c52178d54041ea775aba6b5e6e959a93c61a0f4b1177a
+size 206754384
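
Only this Git LFS pointer is committed; the ~207 MB weight file itself lives in LFS storage. Once downloaded, the file can be verified against the pointer's `oid`, as in this sketch (the local path is an assumption):

```python
import hashlib

# Verify a downloaded model.safetensors against the LFS pointer's sha256 oid.
expected = "61ad9b11299ec080a64c52178d54041ea775aba6b5e6e959a93c61a0f4b1177a"
h = hashlib.sha256()
with open("model.safetensors", "rb") as f:  # local path assumed
    for block in iter(lambda: f.read(1 << 20), b""):  # 1 MiB blocks
        h.update(block)
assert h.hexdigest() == expected, "sha256 mismatch with the LFS pointer"
```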
train_config.json ADDED
@@ -0,0 +1,175 @@
+{
+    "dataset": {
+        "repo_id": "SonDePoisson/so101_test_dataset",
+        "root": ".dev/datasets/SonDePoisson/so101_test_dataset",
+        "episodes": null,
+        "image_transforms": {
+            "enable": false,
+            "max_num_transforms": 3,
+            "random_order": false,
+            "tfs": {
+                "brightness": {
+                    "weight": 1.0,
+                    "type": "ColorJitter",
+                    "kwargs": {
+                        "brightness": [
+                            0.8,
+                            1.2
+                        ]
+                    }
+                },
+                "contrast": {
+                    "weight": 1.0,
+                    "type": "ColorJitter",
+                    "kwargs": {
+                        "contrast": [
+                            0.8,
+                            1.2
+                        ]
+                    }
+                },
+                "saturation": {
+                    "weight": 1.0,
+                    "type": "ColorJitter",
+                    "kwargs": {
+                        "saturation": [
+                            0.5,
+                            1.5
+                        ]
+                    }
+                },
+                "hue": {
+                    "weight": 1.0,
+                    "type": "ColorJitter",
+                    "kwargs": {
+                        "hue": [
+                            -0.05,
+                            0.05
+                        ]
+                    }
+                },
+                "sharpness": {
+                    "weight": 1.0,
+                    "type": "SharpnessJitter",
+                    "kwargs": {
+                        "sharpness": [
+                            0.5,
+                            1.5
+                        ]
+                    }
+                }
+            }
+        },
+        "revision": null,
+        "use_imagenet_stats": true,
+        "video_backend": "torchcodec"
+    },
+    "env": null,
+    "policy": {
+        "type": "act",
+        "n_obs_steps": 1,
+        "normalization_mapping": {
+            "VISUAL": "MEAN_STD",
+            "STATE": "MEAN_STD",
+            "ACTION": "MEAN_STD"
+        },
+        "input_features": {
+            "observation.state": {
+                "type": "STATE",
+                "shape": [
+                    21
+                ]
+            },
+            "observation.images.side": {
+                "type": "VISUAL",
+                "shape": [
+                    3,
+                    256,
+                    256
+                ]
+            },
+            "observation.images.top": {
+                "type": "VISUAL",
+                "shape": [
+                    3,
+                    256,
+                    256
+                ]
+            }
+        },
+        "output_features": {
+            "action": {
+                "type": "ACTION",
+                "shape": [
+                    4
+                ]
+            }
+        },
+        "device": "mps",
+        "use_amp": false,
+        "push_to_hub": true,
+        "repo_id": "SonDePoisson/so101_test_model",
+        "private": null,
+        "tags": null,
+        "license": null,
+        "chunk_size": 100,
+        "n_action_steps": 100,
+        "vision_backbone": "resnet18",
+        "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
+        "replace_final_stride_with_dilation": false,
+        "pre_norm": false,
+        "dim_model": 512,
+        "n_heads": 8,
+        "dim_feedforward": 3200,
+        "feedforward_activation": "relu",
+        "n_encoder_layers": 4,
+        "n_decoder_layers": 1,
+        "use_vae": true,
+        "latent_dim": 32,
+        "n_vae_encoder_layers": 4,
+        "temporal_ensemble_coeff": null,
+        "dropout": 0.1,
+        "kl_weight": 10.0,
+        "optimizer_lr": 1e-05,
+        "optimizer_weight_decay": 0.0001,
+        "optimizer_lr_backbone": 1e-05
+    },
+    "output_dir": "outputs/train/2025-08-27/10-42-53_so101_training",
+    "job_name": "so101_training",
+    "resume": false,
+    "seed": 1000,
+    "num_workers": 8,
+    "batch_size": 8,
+    "steps": 10000,
+    "eval_freq": 20000,
+    "log_freq": 200,
+    "save_checkpoint": true,
+    "save_freq": 20000,
+    "use_policy_training_preset": true,
+    "optimizer": {
+        "type": "adamw",
+        "lr": 1e-05,
+        "weight_decay": 0.0001,
+        "grad_clip_norm": 10.0,
+        "betas": [
+            0.9,
+            0.999
+        ],
+        "eps": 1e-08
+    },
+    "scheduler": null,
+    "eval": {
+        "n_episodes": 50,
+        "batch_size": 50,
+        "use_async_envs": false
+    },
+    "wandb": {
+        "enable": true,
+        "disable_artifact": false,
+        "project": "so101_training",
+        "entity": null,
+        "notes": null,
+        "run_id": "6ppdcojk",
+        "mode": null
+    }
+}
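
The `dataset` block points at `SonDePoisson/so101_test_dataset`, which can be inspected independently of training. A small sketch, assuming a recent lerobot release (older releases import from `lerobot.common.datasets.lerobot_dataset`):

```python
# Dataset inspection sketch -- import path assumed for a recent lerobot release.
from lerobot.datasets.lerobot_dataset import LeRobotDataset

ds = LeRobotDataset("SonDePoisson/so101_test_dataset")
print(ds.num_episodes, ds.num_frames)

sample = ds[0]  # dict of tensors matching the policy's input/output features
print(sample["observation.state"].shape)       # torch.Size([21])
print(sample["observation.images.top"].shape)  # torch.Size([3, 256, 256])
```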