ONNX
Safetensors
LTransition's picture
Upload folder using huggingface_hub
ad16c0e verified
{
"name": "FBcprAuxModel",
"device": "cuda",
"archi": {
"name": "FBcprAuxModelArchiConfig",
"z_dim": 256,
"norm_z": true,
"f": {
"name": "ForwardArchi",
"hidden_dim": 2048,
"model": "residual",
"hidden_layers": 6,
"embedding_layers": 2,
"num_parallel": 2,
"ensemble_mode": "batch",
"input_filter": {
"name": "DictInputFilterConfig",
"key": [
"state",
"privileged_state",
"last_action",
"history_actor"
]
}
},
"b": {
"name": "BackwardArchi",
"hidden_dim": 256,
"hidden_layers": 1,
"norm": true,
"input_filter": {
"name": "DictInputFilterConfig",
"key": [
"state",
"privileged_state"
]
}
},
"actor": {
"name": "actor",
"model": "residual",
"hidden_dim": 2048,
"hidden_layers": 6,
"embedding_layers": 2,
"input_filter": {
"name": "DictInputFilterConfig",
"key": [
"state",
"last_action",
"history_actor"
]
}
},
"critic": {
"name": "ForwardArchi",
"hidden_dim": 2048,
"model": "residual",
"hidden_layers": 6,
"embedding_layers": 2,
"num_parallel": 2,
"ensemble_mode": "batch",
"input_filter": {
"name": "DictInputFilterConfig",
"key": [
"state",
"privileged_state",
"last_action",
"history_actor"
]
}
},
"discriminator": {
"name": "DiscriminatorArchi",
"hidden_dim": 1024,
"hidden_layers": 3,
"input_filter": {
"name": "DictInputFilterConfig",
"key": [
"state",
"privileged_state"
]
}
},
"aux_critic": {
"name": "ForwardArchi",
"hidden_dim": 2048,
"model": "residual",
"hidden_layers": 6,
"embedding_layers": 2,
"num_parallel": 2,
"ensemble_mode": "batch",
"input_filter": {
"name": "DictInputFilterConfig",
"key": [
"state",
"privileged_state",
"last_action",
"history_actor"
]
}
}
},
"obs_normalizer": {
"name": "ObsNormalizerConfig",
"normalizers": {
"state": {
"name": "BatchNormNormalizerConfig",
"momentum": 0.01
},
"privileged_state": {
"name": "BatchNormNormalizerConfig",
"momentum": 0.01
},
"last_action": {
"name": "BatchNormNormalizerConfig",
"momentum": 0.01
},
"history_actor": {
"name": "BatchNormNormalizerConfig",
"momentum": 0.01
}
},
"allow_mismatching_keys": true
},
"inference_batch_size": 500000,
"seq_length": 8,
"actor_std": 0.05,
"amp": false,
"norm_aux_reward": {
"name": "RewardNormalizer",
"translate": false,
"scale": true
}
}