ppo-RND-Pyramids / run_logs /training_status.json
sgoodfriend's picture
Longer time horizon
88cd07d
{
"Pyramids": {
"checkpoints": [
{
"steps": 499781,
"file_path": "results/Pyramids2/Pyramids/Pyramids-499781.onnx",
"reward": 0.361799955368042,
"creation_time": 1673510707.2481713,
"auxillary_file_paths": [
"results/Pyramids2/Pyramids/Pyramids-499781.pt"
]
},
{
"steps": 999987,
"file_path": "results/Pyramids2/Pyramids/Pyramids-999987.onnx",
"reward": null,
"creation_time": 1673511534.2447195,
"auxillary_file_paths": [
"results/Pyramids2/Pyramids/Pyramids-999987.pt"
]
},
{
"steps": 1499905,
"file_path": "results/Pyramids2/Pyramids/Pyramids-1499905.onnx",
"reward": 1.824285694531032,
"creation_time": 1673512370.698666,
"auxillary_file_paths": [
"results/Pyramids2/Pyramids/Pyramids-1499905.pt"
]
},
{
"steps": 1500093,
"file_path": "results/Pyramids2/Pyramids/Pyramids-1500093.onnx",
"reward": 1.8228749781847,
"creation_time": 1673512370.8051713,
"auxillary_file_paths": [
"results/Pyramids2/Pyramids/Pyramids-1500093.pt"
]
}
],
"final_checkpoint": {
"steps": 1500093,
"file_path": "results/Pyramids2/Pyramids.onnx",
"reward": 1.8228749781847,
"creation_time": 1673512370.8051713,
"auxillary_file_paths": [
"results/Pyramids2/Pyramids/Pyramids-1500093.pt"
]
}
},
"metadata": {
"stats_format_version": "0.3.0",
"mlagents_version": "0.29.0.dev0",
"torch_version": "1.8.1+cu102"
}
}