{
    "type": "sac",
    "n_obs_steps": 1,
    "normalization_mapping": {
        "VISUAL": "MEAN_STD",
        "STATE": "MIN_MAX",
        "ENV": "MIN_MAX",
        "ACTION": "MIN_MAX"
    },
    "input_features": {
        "observation.images.front": {
            "type": "VISUAL",
            "shape": [
                3,
                128,
                128
            ]
        },
        "observation.images.wrist": {
            "type": "VISUAL",
            "shape": [
                3,
                128,
                128
            ]
        },
        "observation.state": {
            "type": "STATE",
            "shape": [
                24
            ]
        }
    },
    "output_features": {
        "action": {
            "type": "ACTION",
            "shape": [
                3
            ]
        }
    },
    "device": "cuda",
    "use_amp": false,
    "push_to_hub": true,
    "repo_id": "yfynb1111/realman_sac",
    "private": null,
    "tags": null,
    "license": null,
    "dataset_stats": {
        "observation.images.front": {
            "mean": [
                0.485,
                0.456,
                0.406
            ],
            "std": [
                0.229,
                0.224,
                0.225
            ]
        },
        "observation.images.wrist": {
            "mean": [
                0.485,
                0.456,
                0.406
            ],
            "std": [
                0.229,
                0.224,
                0.225
            ]
        },
        "observation.state": {
            "min": [
                -6.196000099182129,
                -4.026000022888184,
                0.8740000128746033,
                -0.7179999947547913,
                40.55500030517578,
                15.074999809265137,
                -1.0,
                -50.179996490478516,
                -56.030006408691406,
                -279.32000732421875,
                -1.8899999856948853,
                -76.80000305175781,
                -53.25000762939453,
                -9120.0,
                -420.0,
                -2560.0,
                -2801.0,
                -505.0,
                -496.0,
                -277.0,
                -39.0,
                -0.41315099596977234,
                -0.1926412731409073,
                0.15596334636211395
            ],
            "max": [
                41.54800033569336,
                69.69300079345703,
                126.43599700927734,
                2.4509999752044678,
                112.39099884033203,
                64.21399688720703,
                1002.0,
                39.80998992919922,
                137.8900146484375,
                118.1100082397461,
                4.369999885559082,
                141.5899658203125,
                39.650001525878906,
                7380.0,
                387.0,
                -296.0,
                -416.0,
                489.0,
                319.0,
                265.0,
                2020.0,
                -0.1841542273759842,
                0.02644500881433487,
                0.3053857386112213
            ]
        }
    },
    "storage_device": "cpu",
    "vision_encoder_name": "helper2424/resnet10",
    "freeze_vision_encoder": true,
    "image_encoder_hidden_dim": 32,
    "shared_encoder": true,
    "num_discrete_actions": 3,
    "image_embedding_pooling_dim": 8,
    "online_steps": 1000000,
    "online_env_seed": 10000,
    "online_buffer_capacity": 80000,
    "offline_buffer_capacity": 50000,
    "async_prefetch": false,
    "online_step_before_learning": 100,
    "policy_update_freq": 1,
    "discount": 0.97,
    "temperature_init": 0.01,
    "num_critics": 2,
    "num_subsample_critics": null,
    "critic_lr": 0.0003,
    "actor_lr": 0.0003,
    "temperature_lr": 0.0003,
    "critic_target_update_weight": 0.005,
    "utd_ratio": 2,
    "state_encoder_hidden_dim": 256,
    "latent_dim": 256,
    "target_entropy": null,
    "use_backup_entropy": true,
    "grad_clip_norm": 10.0,
    "critic_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true,
        "final_activation": null
    },
    "actor_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true
    },
    "policy_kwargs": {
        "use_tanh_squash": true,
        "std_min": -5.0,
        "std_max": 2.0,
        "init_final": 0.05
    },
    "discrete_critic_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true,
        "final_activation": null
    },
    "actor_learner_config": {
        "learner_host": "127.0.0.1",
        "learner_port": 50051,
        "policy_parameters_push_frequency": 4,
        "queue_get_timeout": 2.0
    },
    "concurrency": {
        "actor": "threads",
        "learner": "threads"
    },
    "use_torch_compile": true
}