ppo-Huggy / run_logs /training_status.json
devjwsong's picture
Trained the first Huggy agent based on PPO.
3e3e5e7 verified
{
"Huggy": {
"checkpoints": [
{
"steps": 199870,
"file_path": "results/Huggy/Huggy/Huggy-199870.onnx",
"reward": 3.239726749019346,
"creation_time": 1706752778.3750024,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-199870.pt"
]
},
{
"steps": 399961,
"file_path": "results/Huggy/Huggy/Huggy-399961.onnx",
"reward": 3.953016260214019,
"creation_time": 1706753035.0462224,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-399961.pt"
]
},
{
"steps": 599951,
"file_path": "results/Huggy/Huggy/Huggy-599951.onnx",
"reward": 4.068377274274826,
"creation_time": 1706753293.9180725,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-599951.pt"
]
},
{
"steps": 799965,
"file_path": "results/Huggy/Huggy/Huggy-799965.onnx",
"reward": 4.229364575795185,
"creation_time": 1706753551.395465,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-799965.pt"
]
},
{
"steps": 999974,
"file_path": "results/Huggy/Huggy/Huggy-999974.onnx",
"reward": 3.623603868054914,
"creation_time": 1706753809.868829,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-999974.pt"
]
},
{
"steps": 1199949,
"file_path": "results/Huggy/Huggy/Huggy-1199949.onnx",
"reward": 3.3977674815965737,
"creation_time": 1706754068.7863774,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1199949.pt"
]
},
{
"steps": 1399956,
"file_path": "results/Huggy/Huggy/Huggy-1399956.onnx",
"reward": 3.8804917310789433,
"creation_time": 1706754324.0964925,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1399956.pt"
]
},
{
"steps": 1599989,
"file_path": "results/Huggy/Huggy/Huggy-1599989.onnx",
"reward": 3.6322373390197753,
"creation_time": 1706754558.731017,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1599989.pt"
]
},
{
"steps": 1799927,
"file_path": "results/Huggy/Huggy/Huggy-1799927.onnx",
"reward": 3.7924101460547672,
"creation_time": 1706754788.9555855,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1799927.pt"
]
},
{
"steps": 1999989,
"file_path": "results/Huggy/Huggy/Huggy-1999989.onnx",
"reward": 4.153508087863093,
"creation_time": 1706755022.321119,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1999989.pt"
]
},
{
"steps": 2000026,
"file_path": "results/Huggy/Huggy/Huggy-2000026.onnx",
"reward": 4.0362441291411715,
"creation_time": 1706755022.4348104,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2000026.pt"
]
}
],
"final_checkpoint": {
"steps": 2000026,
"file_path": "results/Huggy/Huggy.onnx",
"reward": 4.0362441291411715,
"creation_time": 1706755022.4348104,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2000026.pt"
]
}
},
"metadata": {
"stats_format_version": "0.3.0",
"mlagents_version": "1.1.0.dev0",
"torch_version": "2.2.0+cu121"
}
}