act_pretrained / train_config.json
Ekami's picture
Checkpoint step 40000 from wandb https://wandb.ai/peppy-bot/so100-train/runs/jvrbm4sf
476917d verified
{
"output_dir": "$PROJECT_DIR/.cache/so100-train",
"save_checkpoint": true,
"seed": 1000,
"eval_freq": 20000,
"log_freq": 200,
"save_checkpoint_freq": 20000,
"hf_repo_id": "Ekami/act_pretrained",
"env": null,
"num_workers": 4,
"name": "train-act",
"batch_size": 8,
"steps": 150000,
"use_amp": false,
"optimizer": {},
"scheduler": null,
"eval": null,
"wandb": {
"enable": true,
"entity": "peppy-bot",
"project": "so100-train",
"log_dir": "$PROJECT_DIR/.cache/wandb",
"disable_artifact": false,
"notes": ""
},
"policy": {
"type": "act",
"n_obs_steps": 1,
"chunk_size": 100,
"n_action_steps": 100,
"pretrained_path": null,
"reward_delta_indices": null,
"action_delta_indices": [
0,
1,
2,
3,
4,
5,
6,
7,
8,
9,
10,
11,
12,
13,
14,
15,
16,
17,
18,
19,
20,
21,
22,
23,
24,
25,
26,
27,
28,
29,
30,
31,
32,
33,
34,
35,
36,
37,
38,
39,
40,
41,
42,
43,
44,
45,
46,
47,
48,
49,
50,
51,
52,
53,
54,
55,
56,
57,
58,
59,
60,
61,
62,
63,
64,
65,
66,
67,
68,
69,
70,
71,
72,
73,
74,
75,
76,
77,
78,
79,
80,
81,
82,
83,
84,
85,
86,
87,
88,
89,
90,
91,
92,
93,
94,
95,
96,
97,
98,
99
],
"observation_delta_indices": null,
"input_features": {
"observation.state": {
"type": "STATE",
"shape": [
6
]
},
"observation.images.front": {
"type": "VISUAL",
"shape": [
3,
480,
640
]
},
"observation.images.wrist": {
"type": "VISUAL",
"shape": [
3,
480,
640
]
}
},
"output_features": {
"action": {
"type": "ACTION",
"shape": [
6
]
}
},
"normalization_mapping": {
"VISUAL": "MEAN_STD",
"STATE": "MEAN_STD",
"ACTION": "MEAN_STD"
},
"checkpoint_config_save_fields": [
"type",
"n_obs_steps",
"normalization_mapping",
"input_features",
"output_features",
"chunk_size",
"n_action_steps",
"vision_backbone",
"pretrained_backbone_weights",
"replace_final_stride_with_dilation",
"pre_norm",
"dim_model",
"n_heads",
"dim_feedforward",
"feedforward_activation",
"n_encoder_layers",
"n_decoder_layers",
"use_vae",
"latent_dim",
"n_vae_encoder_layers",
"temporal_ensemble_coeff",
"dropout",
"kl_weight"
],
"vision_backbone": "resnet18",
"pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1",
"replace_final_stride_with_dilation": false,
"use_vae": true,
"latent_dim": 32,
"n_vae_encoder_layers": 4,
"pre_norm": false,
"dim_model": 512,
"n_heads": 8,
"dim_feedforward": 3200,
"feedforward_activation": "relu",
"n_encoder_layers": 4,
"n_decoder_layers": 1,
"dropout": 0.1,
"kl_weight": 10.0,
"optimizer_lr_backbone": 0.00001,
"temporal_ensemble_coeff": null
},
"dataset": {
"dataset_dir": "$HF_HOME/lerobot",
"video_backend": "torchcodec",
"single_task": "stack_bricks",
"repo_id": "Ekami/so100",
"revision": "main",
"pull_from_hf_hub": true,
"use_imagenet_stats": true
}
}