| { |
| "anneal_lr": true, |
| "batch_size": 2048, |
| "capture_video": false, |
| "clip_coef": 0.2, |
| "clip_vloss": true, |
| "cuda": true, |
| "ent_coef": 0.01, |
| "env_id": "LunarLander-v2", |
| "exp_name": "ppo", |
| "gae": true, |
| "gae_lambda": 0.95, |
| "gamma": 0.99, |
| "hf_token": "[REDACTED]", |
| "learning_rate": 0.00025, |
| "max_grad_norm": 0.5, |
| "minibatch_size": 256, |
| "norm_adv": true, |
| "num_envs": 8, |
| "num_minibatches": 8, |
| "num_steps": 256, |
| "num_updates": 244, |
| "push_to_hub": true, |
| "repo_id": "alexillovsky/ppo-LunarLander-v2-unit8", |
| "seed": 1, |
| "target_kl": null, |
| "torch_deterministic": true, |
| "total_timesteps": 500000, |
| "track": false, |
| "update_epochs": 4, |
| "vf_coef": 0.5, |
| "wandb_entity": null, |
| "wandb_project_name": "cleanRL" |
| } |