poca-SoccerTwos / run_logs /timers.json
Jobiniah's picture
First Push`
504ef56
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.852378010749817,
"min": 1.8350627422332764,
"max": 1.8768107891082764,
"count": 6
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 34913.62109375,
"min": 5941.634765625,
"max": 40539.11328125,
"count": 6
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 88.03636363636363,
"min": 29.666666666666668,
"max": 88.03636363636363,
"count": 6
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19368.0,
"min": 712.0,
"max": 20120.0,
"count": 6
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1192.4054277979922,
"min": 1190.8040054383152,
"max": 1201.2929666713765,
"count": 6
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 131164.59705777914,
"min": 14400.0,
"max": 189804.28873407748,
"count": 6
},
"SoccerTwos.Step.mean": {
"value": 10049991.0,
"min": 9999982.0,
"max": 10049991.0,
"count": 6
},
"SoccerTwos.Step.sum": {
"value": 10049991.0,
"min": 9999982.0,
"max": 10049991.0,
"count": 6
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.004964224062860012,
"min": -0.09364105761051178,
"max": 0.009783200919628143,
"count": 6
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 0.551028847694397,
"min": -2.561784267425537,
"max": 1.2131168842315674,
"count": 6
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.004720787517726421,
"min": -0.08726067841053009,
"max": 0.010965084657073021,
"count": 6
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 0.5240074396133423,
"min": -2.6891181468963623,
"max": 1.3596705198287964,
"count": 6
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 6
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 6
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.07192071923264512,
"min": -0.6030400037765503,
"max": 0.04130569221527596,
"count": 6
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -7.983199834823608,
"min": -42.29800021648407,
"max": 5.080600142478943,
"count": 6
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.07192071923264512,
"min": -0.6030400037765503,
"max": 0.04130569221527596,
"count": 6
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -7.983199834823608,
"min": -42.29800021648407,
"max": 5.080600142478943,
"count": 6
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 6
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 6
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.018015451532725515,
"min": 0.018015451532725515,
"max": 0.019700842688325792,
"count": 2
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.018015451532725515,
"min": 0.018015451532725515,
"max": 0.019700842688325792,
"count": 2
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.07724483733375867,
"min": 0.07724483733375867,
"max": 0.09004426474372546,
"count": 2
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.07724483733375867,
"min": 0.07724483733375867,
"max": 0.09004426474372546,
"count": 2
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.07705125908056895,
"min": 0.07705125908056895,
"max": 0.09023706714312235,
"count": 2
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.07705125908056895,
"min": 0.07705125908056895,
"max": 0.09023706714312235,
"count": 2
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 5.875427021492605e-07,
"min": 5.875427021492605e-07,
"max": 2.026965382089537e-06,
"count": 2
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 5.875427021492605e-07,
"min": 5.875427021492605e-07,
"max": 2.026965382089537e-06,
"count": 2
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.10008392039800995,
"min": 0.10008392039800995,
"max": 0.10028955223880595,
"count": 2
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.10008392039800995,
"min": 0.10008392039800995,
"max": 0.10028955223880595,
"count": 2
},
"SoccerTwos.Policy.Beta.mean": {
"value": 1.4187627860696568e-05,
"min": 1.4187627860696568e-05,
"max": 2.444865671641781e-05,
"count": 2
},
"SoccerTwos.Policy.Beta.sum": {
"value": 1.4187627860696568e-05,
"min": 1.4187627860696568e-05,
"max": 2.444865671641781e-05,
"count": 2
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1700259473",
"python_version": "3.10.12 | packaged by Anaconda, Inc. | (main, Jul 5 2023, 19:01:18) [MSC v.1916 64 bit (AMD64)]",
"command_line_arguments": "\\\\?\\C:\\Users\\Jonat\\anaconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.1.1+cpu",
"numpy_version": "1.23.5",
"end_time_seconds": "1700259659"
},
"total": 185.82584489999863,
"count": 1,
"self": 0.7753106999880401,
"children": {
"run_training.setup": {
"total": 0.09379280000575818,
"count": 1,
"self": 0.09379280000575818
},
"TrainerController.start_learning": {
"total": 184.95674140000483,
"count": 1,
"self": 0.08903199959604535,
"children": {
"TrainerController._reset_env": {
"total": 5.969565200008219,
"count": 2,
"self": 5.969565200008219
},
"TrainerController.advance": {
"total": 178.67253850038105,
"count": 3443,
"self": 0.07832270073413383,
"children": {
"env_step": {
"total": 64.80500039977778,
"count": 3443,
"self": 49.44157259988424,
"children": {
"SubprocessEnvManager._take_step": {
"total": 15.305126899955212,
"count": 3443,
"self": 0.39619699952891096,
"children": {
"TorchPolicy.evaluate": {
"total": 14.908929900426301,
"count": 6352,
"self": 14.908929900426301
}
}
},
"workers": {
"total": 0.058300899938330986,
"count": 3443,
"self": 0.0,
"children": {
"worker_root": {
"total": 179.18925629938894,
"count": 3443,
"is_parallel": true,
"self": 139.73535029958293,
"children": {
"steps_from_proto": {
"total": 0.004917600002954714,
"count": 4,
"is_parallel": true,
"self": 0.0007504000095650554,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.004167199993389659,
"count": 16,
"is_parallel": true,
"self": 0.004167199993389659
}
}
},
"UnityEnvironment.step": {
"total": 39.448988399803056,
"count": 3443,
"is_parallel": true,
"self": 1.9205469998996705,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 1.6575815995165613,
"count": 3443,
"is_parallel": true,
"self": 1.6575815995165613
},
"communicator.exchange": {
"total": 29.456260600389214,
"count": 3443,
"is_parallel": true,
"self": 29.456260600389214
},
"steps_from_proto": {
"total": 6.41459919999761,
"count": 6886,
"is_parallel": true,
"self": 1.2085421001102077,
"children": {
"_process_rank_one_or_two_observation": {
"total": 5.206057099887403,
"count": 27544,
"is_parallel": true,
"self": 5.206057099887403
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 113.78921539986914,
"count": 3443,
"self": 0.7887009992264211,
"children": {
"process_trajectory": {
"total": 20.89631270064274,
"count": 3443,
"self": 20.71150490063883,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1848078000039095,
"count": 1,
"self": 0.1848078000039095
}
}
},
"_update_policy": {
"total": 92.10420169999998,
"count": 2,
"self": 7.926415099966107,
"children": {
"TorchPOCAOptimizer.update": {
"total": 84.17778660003387,
"count": 60,
"self": 84.17778660003387
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.00000761449337e-06,
"count": 1,
"self": 1.00000761449337e-06
},
"TrainerController._save_models": {
"total": 0.2256047000118997,
"count": 1,
"self": 0.05978990001312923,
"children": {
"RLTrainer._checkpoint": {
"total": 0.16581479999877047,
"count": 1,
"self": 0.16581479999877047
}
}
}
}
}
}
}