ppo-Pyramids / run_logs /training_status.json
arkadyark's picture
First push, baseline model trained for 1M steps
d8286dd
{
"Pyramids": {
"checkpoints": [
{
"steps": 499893,
"file_path": "results/PyramidsTraining/Pyramids/Pyramids-499893.onnx",
"reward": 1.4394999742507935,
"creation_time": 1681694822.2118285,
"auxillary_file_paths": [
"results/PyramidsTraining/Pyramids/Pyramids-499893.pt"
]
},
{
"steps": 999925,
"file_path": "results/PyramidsTraining/Pyramids/Pyramids-999925.onnx",
"reward": 1.6051249895244837,
"creation_time": 1681695275.6527445,
"auxillary_file_paths": [
"results/PyramidsTraining/Pyramids/Pyramids-999925.pt"
]
},
{
"steps": 1000053,
"file_path": "results/PyramidsTraining/Pyramids/Pyramids-1000053.onnx",
"reward": 1.6051249895244837,
"creation_time": 1681695275.7144043,
"auxillary_file_paths": [
"results/PyramidsTraining/Pyramids/Pyramids-1000053.pt"
]
}
],
"final_checkpoint": {
"steps": 1000053,
"file_path": "results/PyramidsTraining/Pyramids.onnx",
"reward": 1.6051249895244837,
"creation_time": 1681695275.7144043,
"auxillary_file_paths": [
"results/PyramidsTraining/Pyramids/Pyramids-1000053.pt"
]
}
},
"metadata": {
"stats_format_version": "0.3.0",
"mlagents_version": "0.31.0.dev0",
"torch_version": "1.11.0+cu113"
}
}