sac / config.json
yfynb1111's picture
Upload policy
abbb998 verified
{
"type": "sac",
"n_obs_steps": 1,
"normalization_mapping": {
"VISUAL": "MEAN_STD",
"STATE": "MIN_MAX",
"ENV": "MIN_MAX",
"ACTION": "MIN_MAX"
},
"input_features": {
"observation.images.front": {
"type": "VISUAL",
"shape": [
3,
128,
128
]
},
"observation.images.wrist": {
"type": "VISUAL",
"shape": [
3,
128,
128
]
},
"observation.state": {
"type": "STATE",
"shape": [
18
]
}
},
"output_features": {
"action": {
"type": "ACTION",
"shape": [
3
]
}
},
"device": "cuda",
"use_amp": false,
"push_to_hub": true,
"repo_id": "yfynb1111/sac",
"private": null,
"tags": null,
"license": null,
"dataset_stats": {
"observation.images.front": {
"mean": [
0.485,
0.456,
0.406
],
"std": [
0.229,
0.224,
0.225
]
},
"observation.images.wrist": {
"mean": [
0.485,
0.456,
0.406
],
"std": [
0.229,
0.224,
0.225
]
},
"observation.state": {
"min": [
-0.6897139549255371,
-1.1421763896942139,
-0.5745007991790771,
-2.97829008102417,
-0.2710767090320587,
1.3246592283248901,
-0.04057434946298599,
-0.21261805295944214,
-0.4548068344593048,
-0.6540042757987976,
-0.3644964098930359,
-1.1057522296905518,
-0.40768879652023315,
-0.2220114767551422,
0.0,
0.19176171720027924,
-0.3013063669204712,
0.00362197193317115
],
"max": [
0.5107022523880005,
0.5516204237937927,
0.5620884299278259,
-1.3330878019332886,
0.32758936285972595,
3.119610548019409,
1.8364211320877075,
0.25358933210372925,
0.36316126585006714,
0.14765967428684235,
0.49947625398635864,
0.144814133644104,
0.2820609211921692,
0.7382049560546875,
255.0,
0.6012658476829529,
0.3005995750427246,
0.5004003643989563
]
}
},
"storage_device": "cpu",
"vision_encoder_name": "helper2424/resnet10",
"freeze_vision_encoder": true,
"image_encoder_hidden_dim": 32,
"shared_encoder": true,
"num_discrete_actions": 3,
"image_embedding_pooling_dim": 8,
"online_steps": 1000000,
"online_env_seed": 10000,
"online_buffer_capacity": 100000,
"offline_buffer_capacity": 100000,
"async_prefetch": false,
"online_step_before_learning": 100,
"policy_update_freq": 1,
"discount": 0.97,
"temperature_init": 0.01,
"num_critics": 2,
"num_subsample_critics": null,
"critic_lr": 0.0003,
"actor_lr": 0.0003,
"temperature_lr": 0.0003,
"critic_target_update_weight": 0.005,
"utd_ratio": 2,
"state_encoder_hidden_dim": 256,
"latent_dim": 64,
"target_entropy": null,
"use_backup_entropy": true,
"grad_clip_norm": 10.0,
"critic_network_kwargs": {
"hidden_dims": [
256,
256
],
"activate_final": true,
"final_activation": null
},
"actor_network_kwargs": {
"hidden_dims": [
256,
256
],
"activate_final": true
},
"policy_kwargs": {
"use_tanh_squash": true,
"std_min": 1e-05,
"std_max": 5.0,
"init_final": 0.05
},
"discrete_critic_network_kwargs": {
"hidden_dims": [
256,
256
],
"activate_final": true,
"final_activation": null
},
"actor_learner_config": {
"learner_host": "127.0.0.1",
"learner_port": 50051,
"policy_parameters_push_frequency": 4,
"queue_get_timeout": 2
},
"concurrency": {
"actor": "threads",
"learner": "threads"
},
"use_torch_compile": true
}