{
  "env_config": {
    "env_id": "Pendulum-v1",
    "env_kwargs": {},
    "max_steps": null,
    "use_image": false,
    "vector_env_num": 6,
    "use_multi_processing": true,
    "image_shape": null,
    "frame_stack": 1,
    "frame_skip": 1,
    "training_render_mode": null
  },
  "device": "cpu",
  "learning_rate": 0.0003,
  "gamma": 0.99,
  "checkpoint_pathname": "",
  "max_grad_norm": 0.5,
  "log_interval": 100,
  "eval_episodes": 50,
  "eval_random_seed": 42,
  "eval_video_num": 10,
  "total_steps": 120000,
  "hidden_sizes": [
    128,
    128
  ],
  "use_layer_norm": true,
  "critic_lr": 0.0003,
  "replay_buffer_capacity": 96000,
  "batch_size": 128,
  "update_start_step": 10000,
  "alpha": 0.2,
  "auto_tune_alpha": true,
  "alpha_lr": 0.0003,
  "target_entropy": -1.0,
  "tau": 0.005,
  "max_action": 2.0,
  "log_std_min": -20,
  "log_std_max": 2
}