|
{ |
|
"name": "root", |
|
"gauges": { |
|
"Pyramids.Policy.Entropy.mean": { |
|
"value": 0.3509610891342163, |
|
"min": 0.3087957203388214, |
|
"max": 0.36777380108833313, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.Entropy.sum": { |
|
"value": 10590.6015625, |
|
"min": 3339.9345703125, |
|
"max": 11009.6767578125, |
|
"count": 14 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.mean": { |
|
"value": 261.5739130434783, |
|
"min": 208.8709677419355, |
|
"max": 333.15555555555557, |
|
"count": 14 |
|
}, |
|
"Pyramids.Environment.EpisodeLength.sum": { |
|
"value": 30081.0, |
|
"min": 6475.0, |
|
"max": 30810.0, |
|
"count": 14 |
|
}, |
|
"Pyramids.Step.mean": { |
|
"value": 1799967.0, |
|
"min": 1409913.0, |
|
"max": 1799967.0, |
|
"count": 14 |
|
}, |
|
"Pyramids.Step.sum": { |
|
"value": 1799967.0, |
|
"min": 1409913.0, |
|
"max": 1799967.0, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.6859020590782166, |
|
"min": 0.578832745552063, |
|
"max": 0.6859020590782166, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 200.2834014892578, |
|
"min": 53.8724479675293, |
|
"max": 200.2834014892578, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.mean": { |
|
"value": 21.957359313964844, |
|
"min": 2.9718246459960938, |
|
"max": 21.957359313964844, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.RndValueEstimate.sum": { |
|
"value": 6411.548828125, |
|
"min": 264.4924011230469, |
|
"max": 6411.548828125, |
|
"count": 14 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.mean": { |
|
"value": 1.720510334675682, |
|
"min": 1.629107512453551, |
|
"max": 1.7911290161071285, |
|
"count": 14 |
|
}, |
|
"Pyramids.Environment.CumulativeReward.sum": { |
|
"value": 199.5791988223791, |
|
"min": 55.524999499320984, |
|
"max": 199.5791988223791, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.mean": { |
|
"value": 1.720510334675682, |
|
"min": 1.629107512453551, |
|
"max": 1.7911290161071285, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.ExtrinsicReward.sum": { |
|
"value": 199.5791988223791, |
|
"min": 55.524999499320984, |
|
"max": 199.5791988223791, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.RndReward.mean": { |
|
"value": 0.22894134176172445, |
|
"min": 0.22894134176172445, |
|
"max": 0.3622605609319483, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.RndReward.sum": { |
|
"value": 26.557195644360036, |
|
"min": 7.3203921407694, |
|
"max": 32.60345048387535, |
|
"count": 14 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.mean": { |
|
"value": 0.07270944114134181, |
|
"min": 0.06266858351548708, |
|
"max": 0.07270944114134181, |
|
"count": 14 |
|
}, |
|
"Pyramids.Losses.PolicyLoss.sum": { |
|
"value": 1.0179321759787854, |
|
"min": 0.27831401882576756, |
|
"max": 1.0420461169269402, |
|
"count": 14 |
|
}, |
|
"Pyramids.Losses.ValueLoss.mean": { |
|
"value": 21.68147027705397, |
|
"min": 0.471697402519307, |
|
"max": 21.68147027705397, |
|
"count": 14 |
|
}, |
|
"Pyramids.Losses.ValueLoss.sum": { |
|
"value": 303.54058387875557, |
|
"min": 1.9932998442091048, |
|
"max": 303.54058387875557, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.LearningRate.mean": { |
|
"value": 2.424611096591275e-06, |
|
"min": 2.424611096591275e-06, |
|
"max": 6.578182807274999e-05, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.LearningRate.sum": { |
|
"value": 3.394455535227785e-05, |
|
"min": 3.394455535227785e-05, |
|
"max": 0.0008766917744364446, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.Epsilon.mean": { |
|
"value": 0.10080817063492063, |
|
"min": 0.10080817063492063, |
|
"max": 0.12192725000000001, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.Epsilon.sum": { |
|
"value": 1.4113143888888888, |
|
"min": 0.48770900000000006, |
|
"max": 1.7875094444444446, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.Beta.mean": { |
|
"value": 9.073624642857163e-05, |
|
"min": 9.073624642857163e-05, |
|
"max": 0.002200532275, |
|
"count": 14 |
|
}, |
|
"Pyramids.Policy.Beta.sum": { |
|
"value": 0.0012703074500000028, |
|
"min": 0.0012703074500000028, |
|
"max": 0.0293337992, |
|
"count": 14 |
|
}, |
|
"Pyramids.Losses.RNDLoss.mean": { |
|
"value": 0.027669908478856087, |
|
"min": 0.027669908478856087, |
|
"max": 0.03692689538002014, |
|
"count": 14 |
|
}, |
|
"Pyramids.Losses.RNDLoss.sum": { |
|
"value": 0.3873787224292755, |
|
"min": 0.14770758152008057, |
|
"max": 0.49223601818084717, |
|
"count": 14 |
|
}, |
|
"Pyramids.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 14 |
|
}, |
|
"Pyramids.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 14 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1728319279", |
|
"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]", |
|
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
|
"mlagents_version": "1.2.0.dev0", |
|
"mlagents_envs_version": "1.2.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.4.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1728320196" |
|
}, |
|
"total": 916.5547743960005, |
|
"count": 1, |
|
"self": 1.1799581080003918, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.06476543600001605, |
|
"count": 1, |
|
"self": 0.06476543600001605 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 915.3100508520001, |
|
"count": 1, |
|
"self": 0.5411470719573117, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 2.24071387100048, |
|
"count": 1, |
|
"self": 2.24071387100048 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 912.4310510820433, |
|
"count": 26117, |
|
"self": 0.5757557350352727, |
|
"children": { |
|
"env_step": { |
|
"total": 710.9093044849951, |
|
"count": 26117, |
|
"self": 649.9562996429831, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 60.62759578393161, |
|
"count": 26117, |
|
"self": 1.8369352299632737, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 58.79066055396834, |
|
"count": 25071, |
|
"self": 58.79066055396834 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 0.3254090580803677, |
|
"count": 26117, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 913.3407672259527, |
|
"count": 26117, |
|
"is_parallel": true, |
|
"self": 311.62826983305786, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0031315679998442647, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0009635180003897403, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0021680499994545244, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0021680499994545244 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.09401083200009452, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006287340002018027, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0005019809996156255, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005019809996156255 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.09124633700048435, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.09124633700048435 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0016337799997927505, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003371640004843357, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0012966159993084148, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0012966159993084148 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 601.7124973928949, |
|
"count": 26116, |
|
"is_parallel": true, |
|
"self": 13.173401732853563, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 9.298754634973193, |
|
"count": 26116, |
|
"is_parallel": true, |
|
"self": 9.298754634973193 |
|
}, |
|
"communicator.exchange": { |
|
"total": 539.8244959001067, |
|
"count": 26116, |
|
"is_parallel": true, |
|
"self": 539.8244959001067 |
|
}, |
|
"steps_from_proto": { |
|
"total": 39.41584512496138, |
|
"count": 26116, |
|
"is_parallel": true, |
|
"self": 8.129025020915833, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 31.286820104045546, |
|
"count": 208928, |
|
"is_parallel": true, |
|
"self": 31.286820104045546 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 200.94599086201288, |
|
"count": 26117, |
|
"self": 1.07309663295473, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 54.34334475605556, |
|
"count": 26117, |
|
"self": 54.253657134056084, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.08968762199947378, |
|
"count": 1, |
|
"self": 0.08968762199947378 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 145.5295494730026, |
|
"count": 189, |
|
"self": 81.035269021967, |
|
"children": { |
|
"TorchPPOOptimizer.update": { |
|
"total": 64.49428045103559, |
|
"count": 6066, |
|
"self": 64.49428045103559 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 1.5699997675255872e-06, |
|
"count": 1, |
|
"self": 1.5699997675255872e-06 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.09713725699930364, |
|
"count": 1, |
|
"self": 0.0016087909989437321, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.09552846600035991, |
|
"count": 1, |
|
"self": 0.09552846600035991 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |