| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.7945910096168518, |
| "min": 0.7279884219169617, |
| "max": 1.477802038192749, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 24053.859375, |
| "min": 21618.34375, |
| "max": 44830.6015625, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989888.0, |
| "min": 29936.0, |
| "max": 989888.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989888.0, |
| "min": 29936.0, |
| "max": 989888.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.177419051527977, |
| "min": -0.09949477761983871, |
| "max": 0.31257808208465576, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 44.70960235595703, |
| "min": -24.077735900878906, |
| "max": 82.83319091796875, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": -9.262030601501465, |
| "min": -9.674857139587402, |
| "max": 0.3218729794025421, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": -2334.03173828125, |
| "min": -2476.763427734375, |
| "max": 83.68697357177734, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06952561540605358, |
| "min": 0.06507565919750079, |
| "max": 0.07300530304327309, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.97335861568475, |
| "min": 0.48709853741038595, |
| "max": 1.039012470835587, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 21.92978182948959, |
| "min": 4.787212734434234e-05, |
| "max": 21.92978182948959, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 307.0169456128542, |
| "min": 0.0006223376554764504, |
| "max": 307.0169456128542, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.768361696292855e-06, |
| "min": 7.768361696292855e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00010875706374809997, |
| "min": 0.00010875706374809997, |
| "max": 0.0036090153969948993, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10258942142857144, |
| "min": 0.10258942142857144, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4362519000000002, |
| "min": 1.3886848, |
| "max": 2.5690767, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00026868320071428566, |
| "min": 0.00026868320071428566, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.003761564809999999, |
| "min": 0.003761564809999999, |
| "max": 0.12031020949, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.006236549932509661, |
| "min": 0.006236549932509661, |
| "max": 0.3460303246974945, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.08731169998645782, |
| "min": 0.08731169998645782, |
| "max": 2.4222123622894287, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 638.7441860465116, |
| "min": 481.1774193548387, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 27466.0, |
| "min": 16863.0, |
| "max": 32337.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 0.8494883401449337, |
| "min": -0.9999290848931959, |
| "max": 1.2673694731320364, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 36.52799862623215, |
| "min": -30.99780163168907, |
| "max": 77.92439848184586, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 0.8494883401449337, |
| "min": -0.9999290848931959, |
| "max": 1.2673694731320364, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 36.52799862623215, |
| "min": -30.99780163168907, |
| "max": 77.92439848184586, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.042039520312797785, |
| "min": 0.03562061621351094, |
| "max": 6.4404986272839935, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 1.8076993734503048, |
| "min": 1.8076993734503048, |
| "max": 109.4884766638279, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1736262948", |
| "python_version": "3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.5.1+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1736266466" |
| }, |
| "total": 3518.0058308730004, |
| "count": 1, |
| "self": 0.6387325229998169, |
| "children": { |
| "run_training.setup": { |
| "total": 0.08458571400001347, |
| "count": 1, |
| "self": 0.08458571400001347 |
| }, |
| "TrainerController.start_learning": { |
| "total": 3517.2825126360003, |
| "count": 1, |
| "self": 2.873206658946401, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 3.084093101999997, |
| "count": 1, |
| "self": 3.084093101999997 |
| }, |
| "TrainerController.advance": { |
| "total": 3511.2329150440532, |
| "count": 63404, |
| "self": 2.9549277619958048, |
| "children": { |
| "env_step": { |
| "total": 2294.8175096110344, |
| "count": 63404, |
| "self": 2091.9090794200383, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 201.22669548900944, |
| "count": 63404, |
| "self": 8.240255661963602, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 192.98643982704584, |
| "count": 62567, |
| "self": 192.98643982704584 |
| } |
| } |
| }, |
| "workers": { |
| "total": 1.6817347019866702, |
| "count": 63404, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 3509.0422792578947, |
| "count": 63404, |
| "is_parallel": true, |
| "self": 1628.9950819799283, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0036418350000531063, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0011698420005359367, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0024719929995171697, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0024719929995171697 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.10704589700003453, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0009220219999406254, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0006511740000405553, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006511740000405553 |
| }, |
| "communicator.exchange": { |
| "total": 0.1031088180000097, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.1031088180000097 |
| }, |
| "steps_from_proto": { |
| "total": 0.002363883000043643, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005069949997960066, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0018568880002476362, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0018568880002476362 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1880.0471972779665, |
| "count": 63403, |
| "is_parallel": true, |
| "self": 55.67691683320163, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 33.45732223491541, |
| "count": 63403, |
| "is_parallel": true, |
| "self": 33.45732223491541 |
| }, |
| "communicator.exchange": { |
| "total": 1649.0304935789025, |
| "count": 63403, |
| "is_parallel": true, |
| "self": 1649.0304935789025 |
| }, |
| "steps_from_proto": { |
| "total": 141.88246463094697, |
| "count": 63403, |
| "is_parallel": true, |
| "self": 31.425059455740666, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 110.4574051752063, |
| "count": 507224, |
| "is_parallel": true, |
| "self": 110.4574051752063 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1213.460477671023, |
| "count": 63404, |
| "self": 5.657545483058584, |
| "children": { |
| "process_trajectory": { |
| "total": 195.57201219895865, |
| "count": 63404, |
| "self": 195.25629988395917, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.31571231499947316, |
| "count": 2, |
| "self": 0.31571231499947316 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 1012.2309199890058, |
| "count": 451, |
| "self": 399.00318520610585, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 613.2277347828999, |
| "count": 22758, |
| "self": 613.2277347828999 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.3960006981506012e-06, |
| "count": 1, |
| "self": 1.3960006981506012e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.09229643500020757, |
| "count": 1, |
| "self": 0.0037344009997468675, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.0885620340004607, |
| "count": 1, |
| "self": 0.0885620340004607 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |