{
  "output_dir": "$PROJECT_DIR/.cache/so100-train",
  "save_checkpoint": true,
  "seed": 1000,
  "eval_freq": 20000,
  "log_freq": 200,
  "save_checkpoint_freq": 20000,
  "hf_repo_id": "Ekami/act_pretrained",
  "env": null,
  "num_workers": 4,
  "name": "train-act",
  "batch_size": 8,
  "steps": 150000,
  "use_amp": false,
  "optimizer": {},
  "scheduler": null,
  "eval": null,
  "wandb": {
    "enable": true,
    "entity": "peppy-bot",
    "project": "so100-train",
    "log_dir": "$PROJECT_DIR/.cache/wandb",
    "disable_artifact": false,
    "notes": ""
  },
  "policy": {
    "type": "act",
    "n_obs_steps": 1,
    "chunk_size": 100,
    "n_action_steps": 100,
    "pretrained_path": null,
    "reward_delta_indices": null,
    "action_delta_indices": [
      0, 1, 2, 3, 4, 5, 6, 7, 8, 9,
      10, 11, 12, 13, 14, 15, 16, 17, 18, 19,
      20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
      30, 31, 32, 33, 34, 35, 36, 37, 38, 39,
      40, 41, 42, 43, 44, 45, 46, 47, 48, 49,
      50, 51, 52, 53, 54, 55, 56, 57, 58, 59,
      60, 61, 62, 63, 64, 65, 66, 67, 68, 69,
      70, 71, 72, 73, 74, 75, 76, 77, 78, 79,
      80, 81, 82, 83, 84, 85, 86, 87, 88, 89,
      90, 91, 92, 93, 94, 95, 96, 97, 98, 99
    ],
    "observation_delta_indices": null,
    "input_features": {
      "observation.state": {
        "type": "STATE",
        "shape": [6]
      },
      "observation.images.front": {
        "type": "VISUAL",
        "shape": [3, 480, 640]
      },
      "observation.images.wrist": {
        "type": "VISUAL",
        "shape": [3, 480, 640]
      }
    },
    "output_features": {
      "action": {
        "type": "ACTION",
        "shape": [6]
      }
    },
    "normalization_mapping": {
      "VISUAL": "MEAN_STD",
      "STATE": "MEAN_STD",
      "ACTION": "MEAN_STD"
    },
    "checkpoint_config_save_fields": [
      "type",
      "n_obs_steps",
      "normalization_mapping",
      "input_features",
      "output_features",
      "chunk_size",
      "n_action_steps",
      "vision_backbone",
      "pretrained_backbone_weights",
      "replace_final_stride_with_dilation",
      "pre_norm",
      "dim_model",
      "n_heads",
      "dim_feedforward",
      "feedforward_activation",
      "n_encoder_layers",
      "n_decoder_layers",
      "use_vae",
      "latent_dim",
      "n_vae_encoder_layers",
      "temporal_ensemble_coeff",
      "dropout",
      "kl_weight"
    ],
    "vision_backbone": "resnet18",
    "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
    "replace_final_stride_with_dilation": false,
    "use_vae": true,
    "latent_dim": 32,
    "n_vae_encoder_layers": 4,
    "pre_norm": false,
    "dim_model": 512,
    "n_heads": 8,
    "dim_feedforward": 3200,
    "feedforward_activation": "relu",
    "n_encoder_layers": 4,
    "n_decoder_layers": 1,
    "dropout": 0.1,
    "kl_weight": 10.0,
    "optimizer_lr_backbone": 0.00001,
    "temporal_ensemble_coeff": null
  },
  "dataset": {
    "dataset_dir": "$HF_HOME/lerobot",
    "video_backend": "torchcodec",
    "single_task": "stack_bricks",
    "repo_id": "Ekami/so100",
    "revision": "main",
    "pull_from_hf_hub": true,
    "use_imagenet_stats": true
  }
}