| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.29054930806159973, |
| "min": 0.23329854011535645, |
| "max": 1.3596144914627075, |
| "count": 122 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 8595.6103515625, |
| "min": 7028.818359375, |
| "max": 41245.265625, |
| "count": 122 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 3659882.0, |
| "min": 29931.0, |
| "max": 3659882.0, |
| "count": 122 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 3659882.0, |
| "min": 29931.0, |
| "max": 3659882.0, |
| "count": 122 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.8309521675109863, |
| "min": -0.14771369099617004, |
| "max": 0.8955442309379578, |
| "count": 122 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 256.76422119140625, |
| "min": -35.5989990234375, |
| "max": 277.61871337890625, |
| "count": 122 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.005796498153358698, |
| "min": -0.020980294793844223, |
| "max": 0.4695992171764374, |
| "count": 122 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 1.7911179065704346, |
| "min": -6.252127647399902, |
| "max": 111.29501342773438, |
| "count": 122 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06827977287632944, |
| "min": 0.06430021362307127, |
| "max": 0.08033802269797195, |
| "count": 122 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9559168202686122, |
| "min": 0.5681599113328735, |
| "max": 1.1247323177716073, |
| "count": 122 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.015933373510571464, |
| "min": 0.00048440896773078735, |
| "max": 0.01664026495598678, |
| "count": 122 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.2230672291480005, |
| "min": 0.006781725548231023, |
| "max": 0.23296370938381492, |
| "count": 122 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 0.00019066262573151784, |
| "min": 0.00019066262573151784, |
| "max": 0.00029948420642193123, |
| "count": 122 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.0026692767602412497, |
| "min": 0.00239587365137545, |
| "max": 0.004344843051718999, |
| "count": 122 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.16355419642857144, |
| "min": 0.16355419642857144, |
| "max": 0.19982806875000003, |
| "count": 122 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 2.2897587500000003, |
| "min": 1.5986245500000003, |
| "max": 2.9482809999999997, |
| "count": 122 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.006359064223214286, |
| "min": 0.006359064223214286, |
| "max": 0.009982824068125, |
| "count": 122 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.089026899125, |
| "min": 0.079862592545, |
| "max": 0.14483327189999998, |
| "count": 122 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.005936332046985626, |
| "min": 0.004931471310555935, |
| "max": 0.4128558039665222, |
| "count": 122 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.08310864865779877, |
| "min": 0.06904059648513794, |
| "max": 3.3028464317321777, |
| "count": 122 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 219.70422535211267, |
| "min": 209.50335570469798, |
| "max": 999.0, |
| "count": 122 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 31198.0, |
| "min": 17241.0, |
| "max": 33288.0, |
| "count": 122 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.7662042135398992, |
| "min": -0.9998375526629388, |
| "max": 1.7904966305566314, |
| "count": 122 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 250.8009983226657, |
| "min": -31.994801685214043, |
| "max": 266.7839979529381, |
| "count": 122 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.7662042135398992, |
| "min": -0.9998375526629388, |
| "max": 1.7904966305566314, |
| "count": 122 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 250.8009983226657, |
| "min": -31.994801685214043, |
| "max": 266.7839979529381, |
| "count": 122 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.013619337259665949, |
| "min": 0.012362895060184254, |
| "max": 7.913583682643043, |
| "count": 122 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 1.9339458908725646, |
| "min": 1.4416112098260783, |
| "max": 142.44450628757477, |
| "count": 122 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 122 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 122 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1739869001", |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.6.0+cu124", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1739878292" |
| }, |
| "total": 9291.524195393, |
| "count": 1, |
| "self": 0.43623197300075844, |
| "children": { |
| "run_training.setup": { |
| "total": 0.020223127999997814, |
| "count": 1, |
| "self": 0.020223127999997814 |
| }, |
| "TrainerController.start_learning": { |
| "total": 9291.067740292, |
| "count": 1, |
| "self": 5.804042537143687, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.1362516149997646, |
| "count": 1, |
| "self": 2.1362516149997646 |
| }, |
| "TrainerController.advance": { |
| "total": 9282.989205800854, |
| "count": 238432, |
| "self": 6.2579750178319955, |
| "children": { |
| "env_step": { |
| "total": 6747.465627329957, |
| "count": 238432, |
| "self": 6151.05580353647, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 592.8423387924167, |
| "count": 238432, |
| "self": 18.244956292917777, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 574.597382499499, |
| "count": 229194, |
| "self": 574.597382499499 |
| } |
| } |
| }, |
| "workers": { |
| "total": 3.567485001069599, |
| "count": 238431, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 9271.431817764855, |
| "count": 238431, |
| "is_parallel": true, |
| "self": 3567.7752929374146, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.002045645999714907, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006433420003304491, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014023039993844577, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014023039993844577 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.049226441999962844, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005485129995577154, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0004293410001992015, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004293410001992015 |
| }, |
| "communicator.exchange": { |
| "total": 0.04660117299999911, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04660117299999911 |
| }, |
| "steps_from_proto": { |
| "total": 0.00164741500020682, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00035003499942831695, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.001297380000778503, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.001297380000778503 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 5703.65652482744, |
| "count": 238430, |
| "is_parallel": true, |
| "self": 120.29463871310145, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 85.7308391218885, |
| "count": 238430, |
| "is_parallel": true, |
| "self": 85.7308391218885 |
| }, |
| "communicator.exchange": { |
| "total": 5130.3556073194, |
| "count": 238430, |
| "is_parallel": true, |
| "self": 5130.3556073194 |
| }, |
| "steps_from_proto": { |
| "total": 367.2754396730493, |
| "count": 238430, |
| "is_parallel": true, |
| "self": 77.79098153192172, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 289.48445814112756, |
| "count": 1907440, |
| "is_parallel": true, |
| "self": 289.48445814112756 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 2529.2656034530646, |
| "count": 238431, |
| "self": 11.475616490120501, |
| "children": { |
| "process_trajectory": { |
| "total": 493.2178023559363, |
| "count": 238431, |
| "self": 492.2649174819371, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.95288487399921, |
| "count": 7, |
| "self": 0.95288487399921 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 2024.5721846070078, |
| "count": 1722, |
| "self": 1103.3897381675624, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 921.1824464394454, |
| "count": 83589, |
| "self": 921.1824464394454 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.341000825050287e-06, |
| "count": 1, |
| "self": 1.341000825050287e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.13823899800081563, |
| "count": 1, |
| "self": 0.002238256001874106, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.13600074199894152, |
| "count": 1, |
| "self": 0.13600074199894152 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |