{
  "hidden_sizes": [
    1024,
    1024,
    512,
    256
  ],
  "learning_rate": 0.002,
  "batch_size": 2048,
  "num_epochs": 40,
  "num_iterations": 2000,
  "value_loss_weight": 0.5,
  "cfr_warmup_iterations": 20,
  "initial_temperature": 2.0,
  "final_temperature": 0.1,
  "temperature_anneal_iters": 400,
  "advantage_clip": 10.0,
  "target_update_interval": 5,
  "target_polyak": 0.1,
  "gradient_clip_norm": 1.0,
  "l2_regularization": 1e-05,
  "gamma": 0.99,
  "eval_frequency": 10,
  "eval_episodes": 100,
  "num_envs": 8192,
  "num_traversals": 1000,
  "seed": 42
}