| # Parameters for Actor: (activation, d_hidden, dropout_p and n_layers carry the same values as the NCritics bindings in this file.) |
| # ============================================================================== |
| Actor.activation = 'leaky_relu' |
| Actor.cont_dist_kind = 'normal' |
| Actor.d_hidden = 300 |
| Actor.dropout_p = 0.0 |
| Actor.gmm_modes = 5 |
| Actor.log_std_high = 2.0 |
| Actor.log_std_low = -5.0 |
| Actor.n_layers = 2 |
|
|
| # Parameters for Agent: (popart and use_multigamma are both True here; presumably they activate the PopArtLayer and Multigammas bindings in this file - TODO confirm.) |
| # ============================================================================== |
| Agent.fake_filter = False |
| Agent.gamma = 0.999 |
| Agent.num_critics = 4 |
| Agent.num_critics_td = 2 |
| Agent.offline_coeff = 1.0 |
| Agent.online_coeff = 0.0 |
| Agent.popart = True |
| Agent.reward_multiplier = 10.0 |
| Agent.tau = 0.003 |
| Agent.use_multigamma = True |
| Agent.use_target_actor = True |
|
|
| # Parameters for Experiment: (learning_rate = 0.0001 with lr_warmup_steps = 500; presumably the rate is warmed up over the first 500 optimizer steps - TODO confirm.) |
| # ============================================================================== |
| Experiment.batches_per_update = 1 |
| Experiment.critic_loss_weight = 10.0 |
| Experiment.env_mode = 'async' |
| Experiment.force_reset_train_envs_every = None |
| Experiment.grad_clip = 1.0 |
| Experiment.has_replay_buffer_rights = True |
| Experiment.l2_coeff = 0.001 |
| Experiment.learning_rate = 0.0001 |
| Experiment.local_time_optimizer = False |
| Experiment.lr_warmup_steps = 500 |
| Experiment.mixed_precision = 'no' |
| Experiment.padded_sampling = 'none' |
| Experiment.save_trajs_as = 'npz' |
| Experiment.stagger_traj_file_lengths = True |
| Experiment.wandb_group_name = None |
|
|
| # Parameters for FlashAttention: (window_size = (-1, -1) presumably means no sliding-window limit, as in the flash-attn API - TODO confirm.) |
| # ============================================================================== |
| FlashAttention.window_size = (-1, -1) |
|
|
| # Parameters for MetamonTstepEncoder: (d_model = 100 with n_heads = 5 gives 20 per head if the width is split evenly across heads - TODO confirm.) |
| # ============================================================================== |
| MetamonTstepEncoder.d_model = 100 |
| MetamonTstepEncoder.extra_emb_dim = 18 |
| MetamonTstepEncoder.n_heads = 5 |
| MetamonTstepEncoder.n_layers = 3 |
| MetamonTstepEncoder.scratch_tokens = 4 |
| MetamonTstepEncoder.token_mask_aug = False |
|
|
| # Parameters for Multigammas: (continuous and discrete hold the same six values; Agent.gamma = 0.999 is not among them.) |
| # ============================================================================== |
| Multigammas.continuous = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995] |
| Multigammas.discrete = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995] |
|
|
| # Parameters for MultiModalEmbedding: (dropout = 0.05, the same value bound to TransformerTurnEmbedding.dropout in this file.) |
| # ============================================================================== |
| MultiModalEmbedding.dropout = 0.05 |
| MultiModalEmbedding.numerical_tokens = 6 |
|
|
| # Parameters for NCritics: (all four values match the corresponding Actor bindings in this file; the critic count is presumably set by Agent.num_critics = 4 - TODO confirm.) |
| # ============================================================================== |
| NCritics.activation = 'leaky_relu' |
| NCritics.d_hidden = 300 |
| NCritics.dropout_p = 0.0 |
| NCritics.n_layers = 2 |
|
|
| # Parameters for PopArtLayer: (presumably only takes effect because Agent.popart = True in this file - TODO confirm.) |
| # ============================================================================== |
| PopArtLayer.beta = 0.0005 |
| PopArtLayer.init_nu = 100.0 |
|
|
| # Parameters for TformerTrajEncoder: (d_model = 512 with n_heads = 8 gives 64 per head if the width is split evenly - TODO confirm; attn/qkv dropout are 0.0 while emb/ff dropout are 0.05.) |
| # ============================================================================== |
| TformerTrajEncoder.activation = 'leaky_relu' |
| TformerTrajEncoder.causal = True |
| TformerTrajEncoder.d_ff = 2048 |
| TformerTrajEncoder.d_model = 512 |
| TformerTrajEncoder.dropout_attn = 0.0 |
| TformerTrajEncoder.dropout_emb = 0.05 |
| TformerTrajEncoder.dropout_ff = 0.05 |
| TformerTrajEncoder.dropout_qkv = 0.0 |
| TformerTrajEncoder.head_scaling = True |
| TformerTrajEncoder.n_heads = 8 |
| TformerTrajEncoder.n_layers = 3 |
| TformerTrajEncoder.norm = 'layer' |
| TformerTrajEncoder.normformer_norms = True |
| TformerTrajEncoder.sigma_reparam = True |
|
|
| # Parameters for TimestepTransformer: |
| # ============================================================================== |
| # None. (No parameter bindings are listed for TimestepTransformer in this file.) |
|
|
| # Parameters for TokenEmbedding: |
| # ============================================================================== |
| # None. (No parameter bindings are listed for TokenEmbedding in this file.) |
|
|
| # Parameters for TransformerTurnEmbedding: (dropout = 0.05, the same value bound to MultiModalEmbedding.dropout in this file.) |
| # ============================================================================== |
| TransformerTurnEmbedding.dropout = 0.05 |
|
|