{ "name": "FBcprAuxModel", "device": "cuda", "archi": { "name": "FBcprAuxModelArchiConfig", "z_dim": 256, "norm_z": true, "f": { "name": "ForwardArchi", "hidden_dim": 2048, "model": "residual", "hidden_layers": 6, "embedding_layers": 2, "num_parallel": 2, "ensemble_mode": "batch", "input_filter": { "name": "DictInputFilterConfig", "key": [ "state", "privileged_state", "last_action", "history_actor" ] } }, "b": { "name": "BackwardArchi", "hidden_dim": 256, "hidden_layers": 1, "norm": true, "input_filter": { "name": "DictInputFilterConfig", "key": [ "state", "privileged_state" ] } }, "actor": { "name": "actor", "model": "residual", "hidden_dim": 2048, "hidden_layers": 6, "embedding_layers": 2, "input_filter": { "name": "DictInputFilterConfig", "key": [ "state", "last_action", "history_actor" ] } }, "critic": { "name": "ForwardArchi", "hidden_dim": 2048, "model": "residual", "hidden_layers": 6, "embedding_layers": 2, "num_parallel": 2, "ensemble_mode": "batch", "input_filter": { "name": "DictInputFilterConfig", "key": [ "state", "privileged_state", "last_action", "history_actor" ] } }, "discriminator": { "name": "DiscriminatorArchi", "hidden_dim": 1024, "hidden_layers": 3, "input_filter": { "name": "DictInputFilterConfig", "key": [ "state", "privileged_state" ] } }, "aux_critic": { "name": "ForwardArchi", "hidden_dim": 2048, "model": "residual", "hidden_layers": 6, "embedding_layers": 2, "num_parallel": 2, "ensemble_mode": "batch", "input_filter": { "name": "DictInputFilterConfig", "key": [ "state", "privileged_state", "last_action", "history_actor" ] } } }, "obs_normalizer": { "name": "ObsNormalizerConfig", "normalizers": { "state": { "name": "BatchNormNormalizerConfig", "momentum": 0.01 }, "privileged_state": { "name": "BatchNormNormalizerConfig", "momentum": 0.01 }, "last_action": { "name": "BatchNormNormalizerConfig", "momentum": 0.01 }, "history_actor": { "name": "BatchNormNormalizerConfig", "momentum": 0.01 } }, "allow_mismatching_keys": true }, "inference_batch_size": 500000, "seq_length": 8, "actor_std": 0.05, "amp": false, "norm_aux_reward": { "name": "RewardNormalizer", "translate": false, "scale": true } }