{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.190852552652359,
"min": 0.190852552652359,
"max": 1.4776930809020996,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 5789.703125,
"min": 5789.703125,
"max": 44827.296875,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999907.0,
"min": 29875.0,
"max": 2999907.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999907.0,
"min": 29875.0,
"max": 2999907.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.8032809495925903,
"min": -0.10419106483459473,
"max": 0.8913851976394653,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 245.80397033691406,
"min": -25.005855560302734,
"max": 269.1983337402344,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.01829381287097931,
"min": -0.058316152542829514,
"max": 0.35751619935035706,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 5.597906589508057,
"min": -15.162199974060059,
"max": 84.73133850097656,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06659412673200547,
"min": 0.0643410952643968,
"max": 0.07499158209100812,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9323177742480766,
"min": 0.599932656728065,
"max": 1.1135934102440288,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.016800466954702557,
"min": 4.7188830995680745e-05,
"max": 0.016800466954702557,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.23520653736583577,
"min": 0.0006134548029438497,
"max": 0.24805232497872604,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.459406656421433e-06,
"min": 1.459406656421433e-06,
"max": 0.0002982828880723708,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.043169318990006e-05,
"min": 2.043169318990006e-05,
"max": 0.003759127546957533,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10048643571428571,
"min": 0.10048643571428571,
"max": 0.19942762916666668,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4068101,
"min": 1.4068101,
"max": 2.6924080000000004,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 5.8594927857143e-05,
"min": 5.8594927857143e-05,
"max": 0.00994282015375,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008203289900000021,
"min": 0.0008203289900000021,
"max": 0.12531894242,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.005474121309816837,
"min": 0.005421524867415428,
"max": 0.3707958459854126,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.07663770020008087,
"min": 0.0760587528347969,
"max": 2.966366767883301,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 208.64383561643837,
"min": 201.45774647887325,
"max": 999.0,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30462.0,
"min": 16290.0,
"max": 32824.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7758652939885653,
"min": -0.9999600519736608,
"max": 1.7977132760769838,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 261.0521982163191,
"min": -30.997601605951786,
"max": 261.0521982163191,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7758652939885653,
"min": -0.9999600519736608,
"max": 1.7977132760769838,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 261.0521982163191,
"min": -30.997601605951786,
"max": 261.0521982163191,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.01208297944255292,
"min": 0.01165229568458289,
"max": 7.72331192475908,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 1.7761979780552792,
"min": 1.6230957971565658,
"max": 131.29630272090435,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1674244483",
"python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1674250896"
},
"total": 6413.5053127930005,
"count": 1,
"self": 0.37370159399961267,
"children": {
"run_training.setup": {
"total": 0.1483111969998845,
"count": 1,
"self": 0.1483111969998845
},
"TrainerController.start_learning": {
"total": 6412.983300002001,
"count": 1,
"self": 4.227269895247446,
"children": {
"TrainerController._reset_env": {
"total": 5.628078054999833,
"count": 1,
"self": 5.628078054999833
},
"TrainerController.advance": {
"total": 6403.018641285754,
"count": 194827,
"self": 4.510763544407382,
"children": {
"env_step": {
"total": 3928.891123245172,
"count": 194827,
"self": 3522.4936965011116,
"children": {
"SubprocessEnvManager._take_step": {
"total": 403.7743198919993,
"count": 194827,
"self": 15.311660703165217,
"children": {
"TorchPolicy.evaluate": {
"total": 388.4626591888341,
"count": 187562,
"self": 137.79051260383244,
"children": {
"TorchPolicy.sample_actions": {
"total": 250.67214658500166,
"count": 187562,
"self": 250.67214658500166
}
}
}
}
},
"workers": {
"total": 2.623106852061028,
"count": 194827,
"self": 0.0,
"children": {
"worker_root": {
"total": 6404.38730032729,
"count": 194827,
"is_parallel": true,
"self": 3207.7228859144066,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.00232741700006045,
"count": 1,
"is_parallel": true,
"self": 0.0007688670000334241,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0015585500000270258,
"count": 8,
"is_parallel": true,
"self": 0.0015585500000270258
}
}
},
"UnityEnvironment.step": {
"total": 0.04378473899987512,
"count": 1,
"is_parallel": true,
"self": 0.0003437779998876067,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005886379999537894,
"count": 1,
"is_parallel": true,
"self": 0.0005886379999537894
},
"communicator.exchange": {
"total": 0.04158878199996252,
"count": 1,
"is_parallel": true,
"self": 0.04158878199996252
},
"steps_from_proto": {
"total": 0.0012635410000712,
"count": 1,
"is_parallel": true,
"self": 0.0003277290002188238,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0009358119998523762,
"count": 8,
"is_parallel": true,
"self": 0.0009358119998523762
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 3196.6644144128836,
"count": 194826,
"is_parallel": true,
"self": 66.7227202963436,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 53.87475066277625,
"count": 194826,
"is_parallel": true,
"self": 53.87475066277625
},
"communicator.exchange": {
"total": 2838.273514727004,
"count": 194826,
"is_parallel": true,
"self": 2838.273514727004
},
"steps_from_proto": {
"total": 237.7934287267601,
"count": 194826,
"is_parallel": true,
"self": 61.241649386461404,
"children": {
"_process_rank_one_or_two_observation": {
"total": 176.5517793402987,
"count": 1558608,
"is_parallel": true,
"self": 176.5517793402987
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2469.6167544961745,
"count": 194827,
"self": 7.22526182844922,
"children": {
"process_trajectory": {
"total": 533.7097957147307,
"count": 194827,
"self": 533.02035039273,
"children": {
"RLTrainer._checkpoint": {
"total": 0.6894453220006653,
"count": 6,
"self": 0.6894453220006653
}
}
},
"_update_policy": {
"total": 1928.6816969529943,
"count": 1389,
"self": 680.729455620942,
"children": {
"TorchPPOOptimizer.update": {
"total": 1247.9522413320524,
"count": 68433,
"self": 1247.9522413320524
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.035999957821332e-06,
"count": 1,
"self": 1.035999957821332e-06
},
"TrainerController._save_models": {
"total": 0.10930972999994992,
"count": 1,
"self": 0.0015776340005686507,
"children": {
"RLTrainer._checkpoint": {
"total": 0.10773209599938127,
"count": 1,
"self": 0.10773209599938127
}
}
}
}
}
}
}