{
  "advantage_scaling": 3.0,
  "cem_iterations": 6,
  "consistency_coeff": 20.0,
  "discount": 0.98,
  "elite_weighting_temperature": 0.5,
  "expectile_weight": 0.9,
  "gaussian_mean_momentum": 0.1,
  "horizon": 5,
  "image_encoder_hidden_dim": 32,
  "input_normalization_modes": {
    "observation.environment_state": "min_max",
    "observation.state": "min_max"
  },
  "input_shapes": {
    "observation.environment_state": [
      16
    ],
    "observation.state": [
      2
    ]
  },
  "latent_dim": 50,
  "max_random_shift_ratio": 0.0476,
  "max_std": 2.0,
  "min_std": 0.05,
  "mlp_dim": 512,
  "n_action_repeats": 1,
  "n_action_steps": 5,
  "n_elites": 50,
  "n_gaussian_samples": 512,
  "n_pi_samples": 51,
  "output_normalization_modes": {
    "action": "min_max"
  },
  "output_shapes": {
    "action": [
      2
    ]
  },
  "pi_coeff": 0.5,
  "q_ensemble_size": 5,
  "reward_coeff": 0.5,
  "state_encoder_hidden_dim": 256,
  "target_model_momentum": 0.995,
  "temporal_decay_coeff": 0.5,
  "uncertainty_regularizer_coeff": 1.0,
  "use_mpc": true,
  "value_coeff": 0.1
}