ppo-Huggy / run_logs /training_status.json
Muhammad Saqib
train on additional 1m steps
550b646 verified
{
"Huggy": {
"checkpoints": [
{
"steps": 799987,
"file_path": "results/Huggy/Huggy/Huggy-799987.onnx",
"reward": 3.6473917050741207,
"creation_time": 1707227362.1068056,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-799987.pt"
]
},
{
"steps": 999973,
"file_path": "results/Huggy/Huggy/Huggy-999973.onnx",
"reward": 3.8706098375186113,
"creation_time": 1707227603.8704143,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-999973.pt"
]
},
{
"steps": 1199906,
"file_path": "results/Huggy/Huggy/Huggy-1199906.onnx",
"reward": 3.791574968418605,
"creation_time": 1707227845.6743715,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1199906.pt"
]
},
{
"steps": 1399996,
"file_path": "results/Huggy/Huggy/Huggy-1399996.onnx",
"reward": 3.7729330327775745,
"creation_time": 1707228088.1357036,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1399996.pt"
]
},
{
"steps": 1599909,
"file_path": "results/Huggy/Huggy/Huggy-1599909.onnx",
"reward": 3.7626003322092076,
"creation_time": 1707228327.2294302,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1599909.pt"
]
},
{
"steps": 1799928,
"file_path": "results/Huggy/Huggy/Huggy-1799928.onnx",
"reward": 3.8987243901128354,
"creation_time": 1707228571.109829,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1799928.pt"
]
},
{
"steps": 1999987,
"file_path": "results/Huggy/Huggy/Huggy-1999987.onnx",
"reward": 4.328619424943571,
"creation_time": 1707228816.591017,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-1999987.pt"
]
},
{
"steps": 2000079,
"file_path": "results/Huggy/Huggy/Huggy-2000079.onnx",
"reward": 4.344622765887867,
"creation_time": 1707228816.7219145,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2000079.pt"
]
},
{
"steps": 2000079,
"file_path": "results/Huggy/Huggy/Huggy-2000079.onnx",
"reward": null,
"creation_time": 1707229532.083456,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2000079.pt"
]
},
{
"steps": 2199970,
"file_path": "results/Huggy/Huggy/Huggy-2199970.onnx",
"reward": 3.867090335268995,
"creation_time": 1707229928.373752,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2199970.pt"
]
},
{
"steps": 2399874,
"file_path": "results/Huggy/Huggy/Huggy-2399874.onnx",
"reward": 4.00003276743106,
"creation_time": 1707230173.364886,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2399874.pt"
]
},
{
"steps": 2599974,
"file_path": "results/Huggy/Huggy/Huggy-2599974.onnx",
"reward": 4.05236953496933,
"creation_time": 1707230418.801743,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2599974.pt"
]
},
{
"steps": 2799921,
"file_path": "results/Huggy/Huggy/Huggy-2799921.onnx",
"reward": 3.8115060528119407,
"creation_time": 1707230660.7077575,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2799921.pt"
]
},
{
"steps": 2999908,
"file_path": "results/Huggy/Huggy/Huggy-2999908.onnx",
"reward": 3.62165554612875,
"creation_time": 1707230902.9507375,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-2999908.pt"
]
},
{
"steps": 3000012,
"file_path": "results/Huggy/Huggy/Huggy-3000012.onnx",
"reward": 3.630279859052087,
"creation_time": 1707230903.0828722,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-3000012.pt"
]
}
],
"final_checkpoint": {
"steps": 3000012,
"file_path": "results/Huggy/Huggy.onnx",
"reward": 3.630279859052087,
"creation_time": 1707230903.0828722,
"auxillary_file_paths": [
"results/Huggy/Huggy/Huggy-3000012.pt"
]
}
},
"metadata": {
"stats_format_version": "0.3.0",
"mlagents_version": "1.1.0.dev0",
"torch_version": "2.2.0+cu121"
}
}