# Hyperparameter bindings, one `Configurable.parameter = value` per line,
# grouped by configurable under a "Parameters for <name>:" banner.
# Values are Python literals (None, True/False, tuples, single-quoted strings),
# which matches gin-config syntax rather than TOML.
# NOTE(review): confirm the consuming loader is gin-config before renaming or
# re-typing any value here.

# Parameters for Actor:
# ==============================================================================
Actor.activation = 'leaky_relu'
Actor.cont_dist_kind = 'normal'
Actor.d_hidden = 300
Actor.dropout_p = 0.0
Actor.gmm_modes = 5
Actor.log_std_high = 2.0
Actor.log_std_low = -5.0
Actor.n_layers = 2

# Parameters for Agent:
# ==============================================================================
Agent.fake_filter = False
Agent.gamma = 0.999
Agent.num_critics = 4
Agent.num_critics_td = 2
Agent.offline_coeff = 1.0
Agent.online_coeff = 0.0
Agent.popart = True
Agent.reward_multiplier = 10.0
Agent.tau = 0.003
Agent.use_multigamma = True
Agent.use_target_actor = True

# Parameters for Experiment:
# ==============================================================================
Experiment.batches_per_update = 1
Experiment.critic_loss_weight = 10.0
Experiment.env_mode = 'async'
Experiment.force_reset_train_envs_every = None
Experiment.grad_clip = 1.0
Experiment.has_replay_buffer_rights = True
Experiment.l2_coeff = 0.001
Experiment.learning_rate = 0.0001
Experiment.local_time_optimizer = False
Experiment.lr_warmup_steps = 500
Experiment.mixed_precision = 'no'
Experiment.padded_sampling = 'none'
Experiment.save_trajs_as = 'npz'
Experiment.stagger_traj_file_lengths = True
Experiment.wandb_group_name = None

# Parameters for FlashAttention:
# ==============================================================================
FlashAttention.window_size = (-1, -1)

# Parameters for MetamonTstepEncoder:
# ==============================================================================
MetamonTstepEncoder.d_model = 100
MetamonTstepEncoder.extra_emb_dim = 18
MetamonTstepEncoder.n_heads = 5
MetamonTstepEncoder.n_layers = 3
MetamonTstepEncoder.scratch_tokens = 4
MetamonTstepEncoder.token_mask_aug = False

# Parameters for Multigammas:
# ==============================================================================
# The continuous and discrete lists are identical in this configuration.
Multigammas.continuous = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995]
Multigammas.discrete = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995]

# Parameters for MultiModalEmbedding:
# ==============================================================================
MultiModalEmbedding.dropout = 0.05
MultiModalEmbedding.numerical_tokens = 6

# Parameters for NCritics:
# ==============================================================================
NCritics.activation = 'leaky_relu'
NCritics.d_hidden = 300
NCritics.dropout_p = 0.0
NCritics.n_layers = 2

# Parameters for PopArtLayer:
# ==============================================================================
PopArtLayer.beta = 0.0005
PopArtLayer.init_nu = 100.0

# Parameters for TformerTrajEncoder:
# ==============================================================================
TformerTrajEncoder.activation = 'leaky_relu'
TformerTrajEncoder.causal = True
TformerTrajEncoder.d_ff = 2048
TformerTrajEncoder.d_model = 512
TformerTrajEncoder.dropout_attn = 0.0
TformerTrajEncoder.dropout_emb = 0.05
TformerTrajEncoder.dropout_ff = 0.05
TformerTrajEncoder.dropout_qkv = 0.0
TformerTrajEncoder.head_scaling = True
TformerTrajEncoder.n_heads = 8
TformerTrajEncoder.n_layers = 3
TformerTrajEncoder.norm = 'layer'
TformerTrajEncoder.normformer_norms = True
TformerTrajEncoder.sigma_reparam = True

# Parameters for TimestepTransformer:
# ==============================================================================
# None.

# Parameters for TokenEmbedding:
# ==============================================================================
# None.

# Parameters for TransformerTurnEmbedding:
# ==============================================================================
TransformerTurnEmbedding.dropout = 0.05