{
  "env_config": {
    "env_id": "Pendulum-v1",
    "env_kwargs": {},
    "max_steps": null,
    "use_image": false,
    "vector_env_num": 6,
    "use_multi_processing": true,
    "image_shape": null,
    "frame_stack": 1,
    "frame_skip": 1,
    "training_render_mode": null
  },
  "device": "cpu",
  "learning_rate": 0.0003,
  "gamma": 0.99,
  "checkpoint_pathname": "",
  "max_grad_norm": 0.5,
  "log_interval": 100,
  "eval_episodes": 50,
  "eval_random_seed": 42,
  "eval_video_num": 10,
  "total_steps": 120000,
  "hidden_sizes": [
    128,
    128
  ],
  "use_layer_norm": true,
  "critic_lr": 0.0003,
  "replay_buffer_capacity": 96000,
  "batch_size": 128,
  "update_start_step": 10000,
  "alpha": 0.2,
  "auto_tune_alpha": true,
  "alpha_lr": 0.0003,
  "target_entropy": -1.0,
  "tau": 0.005,
  "max_action": 2.0,
  "log_std_min": -20,
  "log_std_max": 2
}