ppo-PyramidsRND / run_logs /training_status.json
reeeemo's picture
PPO agent playing PyramidsRND
44b96a1 verified
{
"Pyramids": {
"checkpoints": [
{
"steps": 499962,
"file_path": "results/Pyramids Training/Pyramids/Pyramids-499962.onnx",
"reward": -1.0000000521540642,
"creation_time": 1767221188.5490155,
"auxillary_file_paths": [
"results/Pyramids Training/Pyramids/Pyramids-499962.pt"
]
},
{
"steps": 999962,
"file_path": "results/Pyramids Training/Pyramids/Pyramids-999962.onnx",
"reward": 1.1782799690961838,
"creation_time": 1767222949.7782423,
"auxillary_file_paths": [
"results/Pyramids Training/Pyramids/Pyramids-999962.pt"
]
},
{
"steps": 1000051,
"file_path": "results/Pyramids Training/Pyramids/Pyramids-1000051.onnx",
"reward": 1.2792332967122395,
"creation_time": 1767222949.8643034,
"auxillary_file_paths": [
"results/Pyramids Training/Pyramids/Pyramids-1000051.pt"
]
}
],
"final_checkpoint": {
"steps": 1000051,
"file_path": "results/Pyramids Training/Pyramids.onnx",
"reward": 1.2792332967122395,
"creation_time": 1767222949.8643034,
"auxillary_file_paths": [
"results/Pyramids Training/Pyramids/Pyramids-1000051.pt"
]
}
},
"metadata": {
"stats_format_version": "0.3.0",
"mlagents_version": "1.2.0.dev0",
"torch_version": "2.8.0+cu128"
}
}