| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 1.0541887283325195, |
| "min": 1.0541887283325195, |
| "max": 1.6094080209732056, |
| "count": 25 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 2158.978515625, |
| "min": 1833.224609375, |
| "max": 3296.067626953125, |
| "count": 25 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 49988.0, |
| "min": 1984.0, |
| "max": 49988.0, |
| "count": 25 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 49988.0, |
| "min": 1984.0, |
| "max": 49988.0, |
| "count": 25 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": -0.05214060842990875, |
| "min": -0.0790453627705574, |
| "max": 0.06703026592731476, |
| "count": 25 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": -1.66849946975708, |
| "min": -2.6922693252563477, |
| "max": 2.0779383182525635, |
| "count": 25 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 9.569377899169922, |
| "min": -0.018739579245448112, |
| "max": 10.16330337524414, |
| "count": 25 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 306.2200927734375, |
| "min": -0.5809269547462463, |
| "max": 368.16986083984375, |
| "count": 25 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 25 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 25 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.04542937591947891, |
| "min": 0.04542937591947891, |
| "max": 0.05563530861400068, |
| "count": 10 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.04542937591947891, |
| "min": 0.04542937591947891, |
| "max": 0.05563530861400068, |
| "count": 10 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.21214669170203032, |
| "min": 0.21214669170203032, |
| "max": 8.107888515790304, |
| "count": 10 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.21214669170203032, |
| "min": 0.21214669170203032, |
| "max": 8.107888515790304, |
| "count": 10 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 6.216097927999988e-06, |
| "min": 6.216097927999988e-06, |
| "max": 0.00026928001024, |
| "count": 10 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 6.216097927999988e-06, |
| "min": 6.216097927999988e-06, |
| "max": 0.00026928001024, |
| "count": 10 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10207199999999995, |
| "min": 0.10207199999999995, |
| "max": 0.18975999999999998, |
| "count": 10 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 0.10207199999999995, |
| "min": 0.10207199999999995, |
| "max": 0.18975999999999998, |
| "count": 10 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00011339279999999979, |
| "min": 0.00011339279999999979, |
| "max": 0.004489024, |
| "count": 10 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.00011339279999999979, |
| "min": 0.00011339279999999979, |
| "max": 0.004489024, |
| "count": 10 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.35717928409576416, |
| "min": 0.35717928409576416, |
| "max": 1.3651211261749268, |
| "count": 10 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.35717928409576416, |
| "min": 0.35717928409576416, |
| "max": 1.3651211261749268, |
| "count": 10 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 999.0, |
| "min": 619.0, |
| "max": 999.0, |
| "count": 4 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 14985.0, |
| "min": 619.0, |
| "max": 15984.0, |
| "count": 4 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": -1.0000000447034836, |
| "min": -1.0000000447034836, |
| "max": 1.3809999898076057, |
| "count": 6 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": -15.000000670552254, |
| "min": -15.000000670552254, |
| "max": 1.3809999898076057, |
| "count": 6 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": -1.0000000447034836, |
| "min": -1.0000000447034836, |
| "max": 1.3809999898076057, |
| "count": 6 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": -15.000000670552254, |
| "min": -15.000000670552254, |
| "max": 1.3809999898076057, |
| "count": 6 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 84.27403333981832, |
| "min": 66.98070955276489, |
| "max": 272.6755060036977, |
| "count": 6 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 1264.1105000972748, |
| "min": 66.98070955276489, |
| "max": 4090.1325900554657, |
| "count": 6 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1773035737", |
| "python_version": "3.10.12 (main, Jan 26 2026, 14:55:28) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=PyramidsTraining6 --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.8.0+cu128", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1773035841" |
| }, |
| "total": 103.66781204400013, |
| "count": 1, |
| "self": 0.488246768999943, |
| "children": { |
| "run_training.setup": { |
| "total": 0.022889024000050995, |
| "count": 1, |
| "self": 0.022889024000050995 |
| }, |
| "TrainerController.start_learning": { |
| "total": 103.15667625100014, |
| "count": 1, |
| "self": 0.06532942600051683, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.2636635339999884, |
| "count": 1, |
| "self": 2.2636635339999884 |
| }, |
| "TrainerController.advance": { |
| "total": 100.6935545199999, |
| "count": 3133, |
| "self": 0.06744813999466714, |
| "children": { |
| "env_step": { |
| "total": 66.201567256006, |
| "count": 3133, |
| "self": 56.73546267200254, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 9.42420150599537, |
| "count": 3133, |
| "self": 0.2330886769996141, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 9.191112828995756, |
| "count": 3132, |
| "self": 9.191112828995756 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.04190307800809023, |
| "count": 3133, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 102.5950059210063, |
| "count": 3133, |
| "is_parallel": true, |
| "self": 51.59358566801939, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0017876499996418715, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005678990000888007, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0012197509995530709, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0012197509995530709 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04999150599996938, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005314650002219423, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0004603439997481473, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004603439997481473 |
| }, |
| "communicator.exchange": { |
| "total": 0.04718070399985663, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04718070399985663 |
| }, |
| "steps_from_proto": { |
| "total": 0.0018189930001426546, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005027259999224043, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013162670002202503, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013162670002202503 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 51.00142025298692, |
| "count": 3132, |
| "is_parallel": true, |
| "self": 1.631293846997778, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 1.1118156179863945, |
| "count": 3132, |
| "is_parallel": true, |
| "self": 1.1118156179863945 |
| }, |
| "communicator.exchange": { |
| "total": 42.98308750000797, |
| "count": 3132, |
| "is_parallel": true, |
| "self": 42.98308750000797 |
| }, |
| "steps_from_proto": { |
| "total": 5.275223287994777, |
| "count": 3132, |
| "is_parallel": true, |
| "self": 1.1024208249386902, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 4.172802463056087, |
| "count": 25056, |
| "is_parallel": true, |
| "self": 4.172802463056087 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 34.42453912399924, |
| "count": 3133, |
| "self": 0.08457219098136193, |
| "children": { |
| "process_trajectory": { |
| "total": 13.634503882018635, |
| "count": 3133, |
| "self": 10.160530354019102, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 3.473973527999533, |
| "count": 25, |
| "self": 3.473973527999533 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 20.705463050999242, |
| "count": 10, |
| "self": 12.852384412005904, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 7.853078638993338, |
| "count": 570, |
| "self": 7.853078638993338 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 8.769998203206342e-07, |
| "count": 1, |
| "self": 8.769998203206342e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.13412789399990288, |
| "count": 1, |
| "self": 0.0040049859999271575, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.13012290799997572, |
| "count": 1, |
| "self": 0.13012290799997572 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |