{ "anneal_lr": true, "batch_size": 2048, "capture_video": false, "clip_coef": 0.2, "clip_vloss": true, "cuda": true, "ent_coef": 0.01, "env_id": "LunarLander-v2", "exp_name": "ppo", "gae": true, "gae_lambda": 0.95, "gamma": 0.99, "hf_token": "[REDACTED]", "learning_rate": 0.00025, "max_grad_norm": 0.5, "minibatch_size": 256, "norm_adv": true, "num_envs": 8, "num_minibatches": 8, "num_steps": 256, "num_updates": 244, "push_to_hub": true, "repo_id": "alexillovsky/ppo-LunarLander-v2-unit8", "seed": 1, "target_kl": null, "torch_deterministic": true, "total_timesteps": 500000, "track": false, "update_epochs": 4, "vf_coef": 0.5, "wandb_entity": null, "wandb_project_name": "cleanRL" }